Spaces:

athurlow
/

qcal

Running

qcal / app.py

Claude

Patch `_json_schema_to_python_type` too, not just `get_type`

6e8f79b unverified 19 days ago

11.7 kB

	"""QCal Copilot — Gradio MVP.

	Upload a calibration plot (image) or CSV, get an AI analysis from the
	Ising Calibration VLM, generate a runnable CUDA-Q script, execute it on
	the local cudaq simulator, and optionally run the Ising 3D CNN decoder
	stage on a synthetic surface-code syndrome volume.

	Run:
	python app.py

	Environment (optional):
	NVIDIA_API_KEY API key for build.nvidia.com NIM endpoint
	QCAL_MODEL_ID HF model id for the calibration VLM
	QCAL_NIM_MODEL NIM model name
	QCAL_NIM_ENDPOINT NIM base URL
	QCAL_DECODER_FAST_ID Override fast decoder HF id
	QCAL_DECODER_ACCURATE_ID Override accurate decoder HF id
	"""

	from __future__ import annotations

	import os
	import sys
	from pathlib import Path

	# On HF Spaces the build step only mounts requirements.txt, so `pip install -e .`
	# can't reach pyproject.toml. Put src/ on sys.path so `from qcal import ...`
	# resolves against the src-layout package without needing it installed.
	_SRC = Path(__file__).resolve().parent / "src"
	if _SRC.is_dir() and str(_SRC) not in sys.path:
	sys.path.insert(0, str(_SRC))

	# gradio 4.44.0 crashes on every page load when a JSON sub-schema is a bool
	# (JSON Schema draft 2020-12 allows `additionalProperties: True\|False`, and
	# pydantic emits it). Fixed in 4.44.1, but HF Spaces pins 4.44.0 in its
	# build bootstrap. Wrap both the schema walker and the type dispatcher so
	# bool schemas degrade to "Any" instead of raising APIInfoParseError.
	# Recursion inside gradio_client.utils resolves these names via module
	# globals, so patching the module attributes intercepts every call site.
	try:
	from gradio_client import utils as _gc_utils

	_orig_walk = _gc_utils._json_schema_to_python_type
	_orig_get_type = _gc_utils.get_type

	def _safe_walk(schema, defs=None):
	if isinstance(schema, bool):
	return "Any"
	return _orig_walk(schema, defs)

	def _safe_get_type(schema):
	if not isinstance(schema, dict):
	return "Any"
	return _orig_get_type(schema)

	_gc_utils._json_schema_to_python_type = _safe_walk
	_gc_utils.get_type = _safe_get_type
	except Exception: # noqa: BLE001 — best-effort; don't block startup
	pass

	import gradio as gr

	from qcal import analyzer, codegen, data, decoder, simulator


	# ---------------------------------------------------------------------------
	# Pipeline steps — each step is a pure-ish function Gradio wires together.
	# ---------------------------------------------------------------------------

	def step_analyze(file_obj, backend_choice: str):
	"""Load the file, call the VLM, and prepare the follow-on script."""
	if file_obj is None:
	return (
	gr.update(value="Please upload an image or CSV first."),
	gr.update(value=""),
	gr.update(value=""),
	None,
	gr.update(value=decoder.suggest_error_rate(None)),
	)

	try:
	payload = data.load_payload(file_obj.name if hasattr(file_obj, "name") else file_obj)
	except Exception as exc: # noqa: BLE001
	return (
	gr.update(value=f"Input error: {exc}"),
	"", "", None,
	gr.update(value=decoder.suggest_error_rate(None)),
	)

	summary = payload.summary()
	table_md = payload.table_preview_markdown() if payload.kind == "csv" else None

	result = analyzer.analyze(
	image=payload.image,
	source=payload.source_name or "upload",
	table_preview=table_md,
	backend=backend_choice,
	)

	header = f"### Input\n{summary}\n\n### Analysis\n"
	analysis_md = header + result.markdown()

	script = codegen.generate_script(result.parsed) if result.ok else ""
	script_hint = "" if result.ok else "_(no script generated — fix the analysis error first)_"
	suggested_p = decoder.suggest_error_rate(result.parsed)

	return analysis_md, script, script_hint, result.parsed, gr.update(value=suggested_p)


	def step_run_simulation(script_text: str):
	if not script_text.strip():
	return "_No script to run yet. Analyze a file first._"
	result = simulator.run_script(script_text)
	return simulator.format_result_markdown(result)


	def step_run_decoder(
	variant: str,
	distance: int,
	rounds: int,
	error_rate: float,
	n_shots: int,
	analysis: dict \| None,
	script_text: str,
	):
	"""Run the Ising 3D CNN decoder and refresh metrics/plots/script."""
	result = decoder.run_decoder(
	variant=variant,
	distance=int(distance),
	rounds=int(rounds),
	error_rate=float(error_rate),
	n_shots=int(n_shots),
	)
	metrics_md = result.markdown()

	try:
	fig = decoder.plot_comparison(result) if result.ok else None
	except Exception as exc: # noqa: BLE001
	fig = None
	metrics_md += f"\n\n_(plot unavailable: {exc})_"

	# Re-generate the CUDA-Q script with a decoder header block, so the user
	# can copy a script that documents which decoder ran upstream.
	new_script = script_text
	if result.ok and analysis:
	decoder_info = {
	"variant": result.variant,
	"model_id": result.model_id,
	"distance": result.distance,
	"rounds": result.rounds,
	"density_reduction": result.density_reduction,
	"ler_improvement": result.ler_improvement,
	}
	new_script = codegen.generate_script(analysis, decoder_info=decoder_info)

	return metrics_md, fig, new_script


	# ---------------------------------------------------------------------------
	# UI
	# ---------------------------------------------------------------------------

	CSS = """
	#qcal-header { text-align: center; }
	#qcal-header h1 { margin-bottom: 0; }
	#qcal-header p { margin-top: 4px; color: var(--body-text-color-subdued); }
	footer { visibility: hidden; }
	"""


	def build_ui() -> gr.Blocks:
	default_backend = "nim" if os.getenv("NVIDIA_API_KEY") or os.getenv("NIM_API_KEY") else "local"

	with gr.Blocks(title="QCal Copilot", css=CSS, theme=gr.themes.Soft()) as demo:
	gr.Markdown(
	"""
	<div id="qcal-header">
	<h1>QCal Copilot</h1>
	<p>AI-assisted quantum calibration · Ising VLM + 3D CNN decoder + CUDA-Q</p>
	</div>
	"""
	)

	# State holds the parsed analysis dict so downstream stages (decoder,
	# future 3D CNN tile, etc.) can read it without re-calling the VLM.
	analysis_state = gr.State(value=None)

	# ---- Stage 1: calibration analysis ---------------------------------
	with gr.Row():
	with gr.Column(scale=1):
	file_in = gr.File(
	label="Upload calibration plot or CSV",
	file_types=[
	".png", ".jpg", ".jpeg", ".bmp", ".tiff", ".webp",
	".csv", ".tsv",
	],
	)
	backend_choice = gr.Radio(
	label="Inference backend",
	choices=["auto", "nim", "local"],
	value="auto",
	info=(
	f"Auto-detected default: {default_backend}. "
	"Use `nim` for build.nvidia.com, `local` for Hugging Face."
	),
	)
	analyze_btn = gr.Button("Analyze calibration", variant="primary")
	run_btn = gr.Button("Run simulation")
	gr.Markdown(
	"Tip: set `NVIDIA_API_KEY` to use the NIM endpoint without "
	"downloading the 35B model locally."
	)

	with gr.Column(scale=2):
	analysis_out = gr.Markdown(label="Analysis")
	with gr.Accordion("Generated CUDA-Q script", open=True):
	script_out = gr.Code(
	language="python",
	label="cudaq script (editable before running)",
	value="",
	)
	script_hint = gr.Markdown()
	sim_out = gr.Markdown(label="Simulation result")

	# ---- Stage 2: error-correction decoder -----------------------------
	with gr.Accordion("Error-correction decoder (Ising 3D CNN)", open=False):
	gr.Markdown(
	"Sparsify a synthetic surface-code syndrome volume with one of "
	"the Ising pre-decoders, then hand off to MWPM (PyMatching). "
	"Error rate defaults are suggested from your calibration analysis."
	)
	with gr.Row():
	with gr.Column(scale=1):
	variant_choice = gr.Radio(
	label="Decoder variant",
	choices=[decoder.VARIANT_FAST, decoder.VARIANT_ACCURATE],
	value=decoder.VARIANT_FAST,
	info=(
	"`fast` ≈ 912k params — lower latency. "
	"`accurate` ≈ 1.79M params — better LER."
	),
	)
	distance_slider = gr.Slider(
	3, 11, value=5, step=2,
	label="Code distance (d)",
	)
	rounds_slider = gr.Slider(
	1, 17, value=5, step=1,
	label="Syndrome rounds (T)",
	)
	error_rate_slider = gr.Slider(
	0.0, 0.05, value=0.005, step=0.001,
	label="Physical error rate (p)",
	)
	shots_slider = gr.Slider(
	16, 1024, value=128, step=16,
	label="Shots",
	)
	run_decoder_btn = gr.Button(
	"Run decoder", variant="primary"
	)

	with gr.Column(scale=2):
	decoder_metrics = gr.Markdown(
	"_Run the decoder to see density reduction, MWPM timing, "
	"and LER-proxy improvement here._"
	)
	decoder_plot = gr.Plot(label="Raw vs denoised syndromes")

	analyze_btn.click(
	fn=step_analyze,
	inputs=[file_in, backend_choice],
	outputs=[
	analysis_out, script_out, script_hint, analysis_state,
	error_rate_slider,
	],
	)
	run_btn.click(
	fn=step_run_simulation,
	inputs=[script_out],
	outputs=[sim_out],
	)
	run_decoder_btn.click(
	fn=step_run_decoder,
	inputs=[
	variant_choice, distance_slider, rounds_slider,
	error_rate_slider, shots_slider, analysis_state, script_out,
	],
	outputs=[decoder_metrics, decoder_plot, script_out],
	)

	return demo


	def main() -> None:
	demo = build_ui()
	demo.queue(max_size=8).launch(
	server_name=os.getenv("QCAL_HOST", "0.0.0.0"),
	server_port=int(os.getenv("QCAL_PORT", "7860")),
	share=os.getenv("QCAL_SHARE", "").lower() in {"1", "true", "yes"},
	# Gradio 4.44.0's client-side schema serializer crashes on
	# `additionalProperties: False` ("argument of type 'bool' is not
	# iterable"); fixed in 4.44.1, but HF Spaces pins 4.44.0. Disabling
	# the OpenAPI endpoint avoids the crash — the UI is unaffected.
	show_api=False,
	)


	if __name__ == "__main__":
	main()