| import sys, os, json, time |
| sys.path.append(os.path.dirname(os.path.abspath(__file__))) |
| from flask import Flask, render_template, request, jsonify, send_file, Response, stream_with_context |
| from agent.agent import (run_pipeline, run_query_architect, run_literature_scout, |
| run_evidence_synthesiser, run_citation_builder, llm_invoke_with_retry, get_llm) |
| from reportlab.lib.pagesizes import A4 |
| from reportlab.lib.styles import getSampleStyleSheet, ParagraphStyle |
| from reportlab.lib.units import mm |
| from reportlab.lib import colors |
| from reportlab.platypus import SimpleDocTemplate, Paragraph, Spacer, HRFlowable |
| from reportlab.lib.enums import TA_LEFT |
| import io |
|
|
# Flask application serving the ARIA web UI and its JSON/SSE API routes.
app = Flask(__name__)
|
|
| @app.route("/") |
| def index(): |
| return render_template("index.html") |
|
|
| @app.route("/query", methods=["POST"]) |
| def query(): |
| data = request.get_json() |
| user_query = data.get("query", "").strip() |
| if not user_query: |
| return jsonify({"error": "Empty query"}), 400 |
| try: |
| result = run_pipeline(user_query) |
| return jsonify({ |
| "synthesis": result["synthesis"], |
| "citations": result["citations"], |
| "paper_count": result["paper_count"], |
| "queries": result["queries"] |
| }) |
| except Exception as e: |
| return jsonify({"error": str(e)}), 500 |
|
|
| @app.route("/stream", methods=["GET"]) |
| def stream(): |
| user_query = request.args.get("query", "").strip() |
| if not user_query: |
| return jsonify({"error": "Empty query"}), 400 |
|
|
| def generate(): |
| def emit(event, data): |
| return "event: " + event + "\ndata: " + json.dumps(data) + "\n\n" |
|
|
| try: |
| |
| yield emit("stage", {"stage": 1, "pct": 10}) |
| queries = run_query_architect(user_query) |
| yield emit("queries", {"queries": queries, "pct": 25}) |
|
|
| |
| yield emit("stage", {"stage": 2, "pct": 35}) |
| papers = run_literature_scout(queries) |
| yield emit("papers", {"paper_count": len(papers), "pct": 50}) |
|
|
| |
| yield emit("stage", {"stage": 3, "pct": 55}) |
| from agent.agent import run_prisma_filter |
| filtered = run_prisma_filter(user_query, papers) |
| included = {pmid: p for pmid, p in filtered.items() if p["included"]} |
| yield emit("prisma", { |
| "filtered": { |
| pmid: {"title": p.get("title", ""), "included": p["included"], "reason": p["reason"]} |
| for pmid, p in filtered.items() |
| }, |
| "included_count": len(included), |
| "excluded_count": len(filtered) - len(included), |
| "pct": 65 |
| }) |
| time.sleep(12) |
|
|
| |
| yield emit("stage", {"stage": 4, "pct": 70}) |
| synthesis = run_evidence_synthesiser(user_query, included) |
| yield emit("synthesis", {"synthesis": synthesis, "pct": 88}) |
|
|
| |
| yield emit("stage", {"stage": 5, "pct": 90}) |
| citations = run_citation_builder(included) |
| yield emit("done", { |
| "synthesis": synthesis, |
| "citations": citations, |
| "paper_count": len(included), |
| "queries": queries, |
| "papers": { |
| pmid: { |
| "title": p.get("title", ""), |
| "abstract": p.get("abstract", ""), |
| "authors": p.get("authors", ""), |
| "journal": p.get("journal", ""), |
| "year": p.get("year", "") |
| } for pmid, p in included.items() |
| }, |
| "pct": 100 |
| }) |
|
|
| except Exception as e: |
| yield emit("error", {"message": str(e)}) |
|
|
| return Response( |
| stream_with_context(generate()), |
| mimetype="text/event-stream", |
| headers={ |
| "Cache-Control": "no-cache", |
| "X-Accel-Buffering": "no" |
| } |
| ) |
|
|
| @app.route("/suggest-queries", methods=["POST"]) |
| def suggest_queries(): |
| data = request.get_json() |
| original_query = data.get("query", "") |
| synthesis = data.get("synthesis", "") |
| if not synthesis: |
| return jsonify({"error": "No synthesis provided"}), 400 |
| try: |
| llm = get_llm() |
| prompt = ( |
| f"You are a biomedical research strategist. A researcher asked:\n\"{original_query}\"\n\n" |
| f"Based on this evidence synthesis, identify 3 high-value follow-up research questions " |
| f"that would fill gaps or extend the findings. Return ONLY a JSON array of 3 strings, " |
| f"each a specific, searchable research question. No preamble, no markdown, just the JSON array.\n\n" |
| f"Synthesis excerpt:\n{synthesis[:1200]}" |
| ) |
| response = llm_invoke_with_retry(llm, prompt) |
| raw = response.content.strip() |
| |
| if raw.startswith("```"): |
| raw = raw.split("```")[1] |
| if raw.startswith("json"): |
| raw = raw[4:] |
| suggestions = json.loads(raw.strip()) |
| if not isinstance(suggestions, list): |
| suggestions = [] |
| return jsonify({"suggestions": suggestions[:3]}) |
| except Exception as e: |
| return jsonify({"error": str(e)}), 500 |
|
|
| @app.route("/export-pdf", methods=["POST"]) |
| def export_pdf(): |
| data = request.get_json() |
| synthesis = data.get("synthesis", "") |
| citations = data.get("citations", "") |
| query = data.get("query", "Biomedical Research Query") |
| paper_count = data.get("paper_count", 0) |
|
|
| buf = io.BytesIO() |
| doc = SimpleDocTemplate(buf, pagesize=A4, |
| leftMargin=20*mm, rightMargin=20*mm, |
| topMargin=20*mm, bottomMargin=20*mm) |
|
|
| accent = colors.HexColor("#00e5a0") |
| dark = colors.HexColor("#111827") |
|
|
| title_style = ParagraphStyle("title", |
| fontName="Helvetica-Bold", fontSize=18, |
| textColor=dark, spaceAfter=4) |
| meta_style = ParagraphStyle("meta", |
| fontName="Helvetica", fontSize=9, |
| textColor=colors.HexColor("#5a6a7a"), spaceAfter=16) |
| section_label_style = ParagraphStyle("sec_label", |
| fontName="Helvetica-Bold", fontSize=10, |
| textColor=accent, spaceBefore=14, spaceAfter=4) |
| body_style = ParagraphStyle("body", |
| fontName="Helvetica", fontSize=10, |
| leading=16, textColor=dark, spaceAfter=6) |
| cite_style = ParagraphStyle("cite", |
| fontName="Helvetica", fontSize=8, |
| leading=13, textColor=colors.HexColor("#444444"), |
| spaceAfter=4) |
|
|
| story = [] |
| story.append(Paragraph("ARIA — Autonomous Research Intelligence Agent", title_style)) |
| story.append(Paragraph( |
| "Query: " + query + " | " + str(paper_count) + " papers retrieved | Groq LLaMA-3.1", |
| meta_style)) |
| story.append(HRFlowable(width="100%", thickness=1, |
| color=colors.HexColor("#1e2936"), spaceAfter=16)) |
|
|
| SECTIONS = [ |
| ("## Background", "Background"), |
| ("## Key Findings", "Key Findings"), |
| ("## Level of Evidence", "Level of Evidence"), |
| ("## Conflicting Evidence", "Conflicting Evidence"), |
| ("## Research Gaps", "Research Gaps"), |
| ("## Clinical Implications", "Clinical Implications"), |
| ] |
| for marker, label in SECTIONS: |
| start = synthesis.find(marker) |
| if start == -1: |
| continue |
| content_start = start + len(marker) |
| next_markers = [synthesis.find(m) for m, _ in SECTIONS if synthesis.find(m) > start] |
| end = min(next_markers) if next_markers else len(synthesis) |
| text = synthesis[content_start:end].strip() |
| if not text: |
| continue |
| story.append(Paragraph(label.upper(), section_label_style)) |
| for para in text.split("\n"): |
| para = para.strip() |
| if para: |
| story.append(Paragraph(para, body_style)) |
|
|
| story.append(Spacer(1, 8*mm)) |
| story.append(HRFlowable(width="100%", thickness=1, |
| color=colors.HexColor("#1e2936"), spaceAfter=8)) |
| story.append(Paragraph("REFERENCES", section_label_style)) |
| for line in citations.split("\n"): |
| line = line.strip() |
| if line: |
| story.append(Paragraph(line, cite_style)) |
|
|
| story.append(Spacer(1, 6*mm)) |
| story.append(Paragraph( |
| "AI-generated synthesis — verify against primary sources before clinical use.", |
| ParagraphStyle("disclaimer", fontName="Helvetica-Oblique", |
| fontSize=8, textColor=colors.HexColor("#999999")))) |
|
|
| doc.build(story) |
| buf.seek(0) |
| safe_query = "".join(c for c in query[:40] if c.isalnum() or c in " -_").strip() |
| filename = "ARIA_" + safe_query.replace(" ", "_") + ".pdf" |
| return send_file(buf, mimetype="application/pdf", |
| as_attachment=True, download_name=filename) |
|
|
| @app.route("/score", methods=["POST"]) |
| def score(): |
| data = request.get_json() |
| synthesis = data.get("synthesis", "") |
| if not synthesis: |
| return jsonify({"error": "No synthesis provided"}), 400 |
| try: |
| from agent.agent import run_confidence_scorer |
| scores = run_confidence_scorer(synthesis) |
| return jsonify({"scores": scores}) |
| except Exception as e: |
| return jsonify({"error": str(e)}), 500 |
|
|
| @app.route("/selective-review", methods=["POST"]) |
| def selective_review(): |
| data = request.get_json() |
| question = data.get("question", "") |
| selected_papers = data.get("papers", {}) |
| if not selected_papers: |
| return jsonify({"error": "No papers selected"}), 400 |
| try: |
| from agent.agent import run_selective_review |
| review = run_selective_review(question, selected_papers) |
| return jsonify({"review": review}) |
| except Exception as e: |
| return jsonify({"error": str(e)}), 500 |
|
|
| @app.route("/predict", methods=["POST"]) |
| def predict(): |
| data = request.get_json() |
| question = data.get("question", "") |
| synthesis = data.get("synthesis", "") |
| if not synthesis: |
| return jsonify({"error": "No synthesis provided"}), 400 |
| try: |
| from agent.agent import run_predictive_model |
| prediction = run_predictive_model(question, synthesis) |
| return jsonify({"prediction": prediction}) |
| except Exception as e: |
| return jsonify({"error": str(e)}), 500 |
|
|
# Session persistence: a small JSON history file stored next to this module.
# NOTE(review): `json` is already imported at the top of the file, so the
# `_json` alias looks redundant — kept because the helpers below reference it.
import json as _json
from datetime import datetime
SESSIONS_FILE = os.path.join(os.path.dirname(os.path.abspath(__file__)), "sessions.json")
|
|
def load_sessions(path=None):
    """Return the saved-session list from *path* (default: SESSIONS_FILE).

    Any read or parse failure — missing file, unreadable file, invalid
    JSON — yields an empty list. The optional *path* parameter is a
    backward-compatible generalization; existing callers pass nothing.
    """
    target = SESSIONS_FILE if path is None else path
    try:
        # with-block closes the handle (the original leaked the open file).
        with open(target) as fh:
            return _json.load(fh)
    except (OSError, ValueError):
        # ValueError covers json.JSONDecodeError; the original bare `except:`
        # also swallowed KeyboardInterrupt/SystemExit.
        return []
|
|
def save_session(entry):
    """Prepend *entry* to the session history, keeping only the 20 newest."""
    sessions = load_sessions()
    sessions.insert(0, entry)
    sessions = sessions[:20]
    # with-block guarantees flush + close; the original passed an inline
    # open() to _json.dump and leaked the writable handle.
    with open(SESSIONS_FILE, "w") as fh:
        _json.dump(sessions, fh, indent=2)
|
|
| @app.route("/sessions", methods=["GET"]) |
| def get_sessions(): |
| return jsonify({"sessions": load_sessions()}) |
|
|
| @app.route("/sessions/save", methods=["POST"]) |
| def save_session_route(): |
| data = request.get_json() |
| save_session({ |
| "id": datetime.now().strftime("%Y%m%d%H%M%S"), |
| "timestamp": datetime.now().strftime("%b %d, %H:%M"), |
| "query": data.get("query", ""), |
| "synthesis": data.get("synthesis", ""), |
| "citations": data.get("citations", ""), |
| "paper_count": data.get("paper_count", 0), |
| "queries": data.get("queries", []), |
| "papers": data.get("papers", {}) |
| }) |
| return jsonify({"ok": True}) |
|
|
| @app.route("/extract-table", methods=["POST"]) |
| def extract_table(): |
| data = request.get_json() |
| question = data.get("question", "") |
| synthesis = data.get("synthesis", "") |
| papers = data.get("papers", {}) |
| if not synthesis: |
| return jsonify({"error": "No synthesis provided"}), 400 |
| try: |
| from agent.agent import run_table_extractor |
| table = run_table_extractor(question, synthesis, papers) |
| return jsonify({"table": table}) |
| except Exception as e: |
| import traceback |
| traceback.print_exc() |
| return jsonify({"error": str(e)}), 500 |
|
|
| @app.route("/followup", methods=["POST"]) |
| def followup(): |
| data = request.get_json() |
| question = data.get("question", "") |
| original_question = data.get("original_question", "") |
| synthesis = data.get("synthesis", "") |
| papers = data.get("papers", {}) |
| if not question or not synthesis: |
| return jsonify({"error": "Missing question or synthesis"}), 400 |
| try: |
| llm = get_llm() |
| corpus = "\n\n".join( |
| f"[PMID {pmid}] {p.get('title','')}\n{p.get('abstract','')[:300]}" |
| for pmid, p in list(papers.items())[:6] |
| ) |
| prompt = ( |
| f"You are a biomedical research assistant. The user previously asked:\n" |
| f"\"{original_question}\"\n\n" |
| f"Based on this evidence synthesis and retrieved papers, answer their follow-up question.\n" |
| f"Be concise and cite PMIDs where relevant.\n\n" |
| f"Synthesis:\n{synthesis[:1500]}\n\n" |
| f"Papers:\n{corpus}\n\n" |
| f"Follow-up Question: {question}" |
| ) |
| response = llm_invoke_with_retry(llm, prompt) |
| return jsonify({"answer": response.content}) |
| except Exception as e: |
| return jsonify({"error": str(e)}), 500 |
|
|
| if __name__ == "__main__": |
| port = int(os.environ.get("PORT", 7860)) |
| app.run(host="0.0.0.0", port=port, debug=False, threaded=True) |