Spaces:

wehe1pwe
/

math-under-llm

Running

Alex W.

Models analyzed after app startup did not appear in the Tab 6 model selector.

5827b27 8 days ago

14.1 kB

	# ui/tab_tables.py
	"""
	Tab6: Tables — Paper-ready table generation for Wang's Five Laws.
	Data: language modality, standard layers only, from SQLite DB.
	Output: Gradio DataFrames + LaTeX + Markdown + CSV downloads.
	"""

	import io
	import os
	import zipfile
	import tempfile

	import gradio as gr
	import pandas as pd

	from db.schema import init_db
	from db.reader import get_layer_metrics, get_analyzed_models
	from core.table_gen import (
	generate_all_tables,
	format_all_latex,
	format_all_markdown,
	TABLE_META,
	)

	_OUT_DIR = "/tmp/wang_tables"
	os.makedirs(_OUT_DIR, exist_ok=True)


	# ─────────────────────────────────────────────────────────────────────────────
	# DB helpers
	# ─────────────────────────────────────────────────────────────────────────────

	def _get_model_choices() -> list[str]:
	try:
	conn = init_db()
	df = get_analyzed_models(conn)
	return df["model_id"].tolist() if not df.empty else []
	except Exception:
	return []


	def _load_all_models(choices: list[str]) -> dict[str, pd.DataFrame]:
	"""Load language-modality standard-layer data for all selected models."""
	conn = init_db()
	out = {}
	for mid in choices:
	df = get_layer_metrics(
	conn,
	model_id = mid,
	modality = "language",
	layer_type = None, # keep both; table_gen filters internally
	start_layer= 0,
	end_layer = 9999,
	)
	if not df.empty:
	out[mid] = df
	return out


	def _parse_groups(text: str) -> list[tuple[int, int]]:
	"""
	Parse user-defined layer groups.
	Format: "0-11, 12-23, 24-35, 36-47"
	Returns list of (lo, hi) tuples.
	"""
	groups = []
	for part in text.split(","):
	part = part.strip()
	if "-" in part:
	try:
	lo_s, hi_s = part.split("-", 1)
	groups.append((int(lo_s.strip()), int(hi_s.strip())))
	except ValueError:
	continue
	return groups if groups else [(0, 11), (12, 23), (24, 35), (36, 47)]


	def _save_csv(df: pd.DataFrame, name: str) -> str:
	path = os.path.join(_OUT_DIR, f"{name}.csv")
	df.to_csv(path, index=False)
	return path


	def _make_zip(paths: list[str]) -> str:
	zp = os.path.join(_OUT_DIR, "wang_laws_tables.zip")
	with zipfile.ZipFile(zp, "w", zipfile.ZIP_DEFLATED) as zf:
	for p in paths:
	if p and os.path.exists(p):
	zf.write(p, os.path.basename(p))
	return zp


	def _save_text(content: str, name: str) -> str:
	path = os.path.join(_OUT_DIR, name)
	with open(path, "w", encoding="utf-8") as f:
	f.write(content)
	return path


	# ─────────────────────────────────────────────────────────────────────────────
	# Main generation function
	# ─────────────────────────────────────────────────────────────────────────────

	def generate_tables(
	selected_models: list[str],
	table2_model_a: str,
	table2_model_b: str,
	group_text: str,
	progress=gr.Progress(),
	):
	"""
	Returns:
	status, t1_df, t2_df, t3_df, t4_df, t5_df, t6_df,
	latex_text, md_text,
	csv_t1, csv_t2, csv_t3, csv_t4, csv_t5, csv_t6,
	latex_file, md_file, zip_file
	"""
	EMPTY = tuple([None] * 17)

	if not selected_models:
	return ("❌ Please select at least one model.",) + EMPTY[1:]

	progress(0.05, desc="Loading data from DB...")
	model_dfs = _load_all_models(selected_models)

	if not model_dfs:
	return ("❌ No language-modality data found. Run Tab 2 analysis first.",) + EMPTY[1:]

	progress(0.25, desc="Parsing layer groups...")
	group_bounds = _parse_groups(group_text)

	# Validate Table 2 model selection
	name_a = table2_model_a if table2_model_a in model_dfs else None
	name_b = table2_model_b if table2_model_b in model_dfs else None
	if name_b == name_a:
	name_b = None

	progress(0.40, desc="Computing tables...")
	tables = generate_all_tables(
	model_dfs = model_dfs,
	group_bounds = group_bounds,
	name_a = name_a,
	name_b = name_b,
	)

	progress(0.65, desc="Formatting LaTeX & Markdown...")
	latex_str = format_all_latex(tables)
	md_str = format_all_markdown(tables)

	progress(0.80, desc="Saving files...")
	csv_paths = {}
	for key, df in tables.items():
	csv_paths[key] = _save_csv(df, f"wang_laws_{key}")

	latex_file = _save_text(latex_str, "wang_laws_tables.tex")
	md_file = _save_text(md_str, "wang_laws_tables.md")
	zip_file = _make_zip(list(csv_paths.values()) + [latex_file, md_file])

	loaded = list(model_dfs.keys())
	status = (
	f"✅ Generated 6 tables \| {len(loaded)} models loaded\n"
	f" Models: {', '.join(loaded)}\n"
	f" Layer groups (Table 2): {group_bounds}\n"
	f" Table 2 comparison: {name_a or '—'} vs {name_b or '—'}\n"
	f" Note: language modality, standard layers only (global layers excluded)"
	)

	progress(1.0)
	return (
	status,
	tables["t1"], tables["t2"], tables["t3"],
	tables["t4"], tables["t5"], tables["t6"],
	latex_str, md_str,
	csv_paths["t1"], csv_paths["t2"], csv_paths["t3"],
	csv_paths["t4"], csv_paths["t5"], csv_paths["t6"],
	latex_file, md_file, zip_file,
	)


	# ─────────────────────────────────────────────────────────────────────────────
	# Tab6 UI
	# ─────────────────────────────────────────────────────────────────────────────

	def build_tab_tables():
	with gr.Tab("📋 Tables"):
	gr.Markdown("""
	## Wang's Five Laws — Paper Tables

	One-click generation of all 6 tables. Data: language modality, standard layers only
	(global/K=V-shared layers excluded from all metrics).

	\| Table \| Content \| Law \|
	\|-------\|---------\|-----\|
	\| 1 \| Cross-model summary: Pearson r, SSR (Wang Score in Table 6) \| 1 & 2 \|
	\| 2 \| SSR layer-group trend (RL effect, user-defined groups) \| 2 \|
	\| 3 \| Output subspace cosU: Q–K, Q–V, K–V + random baseline \| 4 \|
	\| 4 \| Input subspace cosV: Q–K, Q–V, K–V + random baseline \| 5 \|
	\| 5 \| Condition number κ: median all layers + Layer 0 + deep layers \| 3 \|
	\| 6 \| Wang Score leaderboard (ranked) \| 1 & 2 \|

	> Run Tab 2 (Analyze) first to populate the database.
	""")

	# ── Model selector with Refresh ───────────────────────────────────────
	def _refresh_choices():
	new_choices = _get_model_choices()
	return (
	gr.CheckboxGroup(choices=new_choices, value=new_choices),
	gr.Dropdown(choices=new_choices),
	gr.Dropdown(choices=new_choices),
	)

	init_choices = _get_model_choices()

	# ── Controls ──────────────────────────────────────────────────────────
	with gr.Row():
	with gr.Column(scale=3):
	with gr.Row():
	gr.Markdown("Models to include (all tables use selected models)")
	refresh_btn = gr.Button("🔄 Refresh", scale=0, min_width=100)
	model_selector = gr.CheckboxGroup(
	choices = init_choices,
	value = init_choices,
	label = "",
	show_label=False,
	)
	with gr.Column(scale=2):
	gr.Markdown("Table 2 — SSR Layer-Group Comparison")
	t2_model_a = gr.Dropdown(
	choices = init_choices,
	value = init_choices[0] if init_choices else None,
	allow_custom_value=True,
	label = "Model A (base)",
	)
	t2_model_b = gr.Dropdown(
	choices = init_choices,
	value = init_choices[1] if len(init_choices) > 1 else None,
	allow_custom_value=True,
	label = "Model B (RL-tuned / comparison)",
	info = "Leave same as A for single-model view",
	)
	group_input = gr.Textbox(
	label = "Layer groups (comma-separated lo-hi pairs)",
	value = "0-11, 12-23, 24-35, 36-47",
	placeholder = "0-11, 12-23, 24-35, 36-47",
	info = "Adjust for model depth: 32-layer→0-7,8-15,16-23,24-31 60-layer→0-14,15-29,30-44,45-59",
	)

	generate_btn = gr.Button("🚀 Generate All Tables", variant="primary")
	status_box = gr.Textbox(lines=4, interactive=False, label="Status")

	gr.Markdown("---")

	# ── Table displays ────────────────────────────────────────────────────
	with gr.Accordion("📊 Table 1 — Cross-Model Summary (Law 1 & 2)", open=True):
	t1_df = gr.Dataframe(interactive=False, wrap=True)
	dl_t1 = gr.File(label="⬇ CSV")

	with gr.Accordion("📊 Table 2 — SSR Layer-Group Trend (Law 2)", open=True):
	t2_df = gr.Dataframe(interactive=False, wrap=True)
	dl_t2 = gr.File(label="⬇ CSV")

	with gr.Accordion("📊 Table 3 — Output Subspace cosU (Law 4)", open=True):
	t3_df = gr.Dataframe(interactive=False, wrap=True)
	dl_t3 = gr.File(label="⬇ CSV")

	with gr.Accordion("📊 Table 4 — Input Subspace cosV (Law 5)", open=True):
	t4_df = gr.Dataframe(interactive=False, wrap=True)
	dl_t4 = gr.File(label="⬇ CSV")

	with gr.Accordion("📊 Table 5 — Condition Number κ (Law 3)", open=True):
	t5_df = gr.Dataframe(interactive=False, wrap=True)
	dl_t5 = gr.File(label="⬇ CSV")

	with gr.Accordion("📊 Table 6 — Wang Score Leaderboard", open=True):
	t6_df = gr.Dataframe(interactive=False, wrap=True)
	dl_t6 = gr.File(label="⬇ CSV")

	gr.Markdown("---")

	# ── Text outputs ──────────────────────────────────────────────────────
	with gr.Accordion("📄 LaTeX Output (paste into .tex)", open=False):
	latex_box = gr.Code(
	language = "latex",
	label = "LaTeX tables (booktabs style)",
	interactive= False,
	lines = 30,
	)

	with gr.Accordion("📄 Markdown Output (paste into README)", open=False):
	md_box = gr.Code(
	language = "markdown",
	label = "Markdown tables (GitHub-flavored)",
	interactive= False,
	lines = 30,
	)

	gr.Markdown("---")

	# ── Bulk downloads ────────────────────────────────────────────────────
	gr.Markdown("### ⬇ Bulk Downloads")
	with gr.Row():
	dl_latex = gr.File(label="⬇ wang_laws_tables.tex")
	dl_md = gr.File(label="⬇ wang_laws_tables.md")
	dl_zip = gr.File(label="⬇ ZIP (all CSVs + LaTeX + Markdown)")

	gr.Markdown("""
	---
	Notes
	- All tables use language modality and standard layers only.
	Global (K=V-shared) layers are excluded from metrics but their count is shown in Table 1.
	- Table 2 layer groups are user-defined. Suggested defaults:
	48-layer models → `0-11, 12-23, 24-35, 36-47`
	32-layer models → `0-7, 8-15, 16-23, 24-31`
	60-layer models → `0-14, 15-29, 30-44, 45-59`
	- LaTeX output uses `booktabs` style (`\\toprule`, `\\midrule`, `\\bottomrule`).
	Add `\\usepackage{booktabs}` to your preamble.
	- Wang Score = 1 − median(SSR_QK). Theoretical maximum = 1.
	""")

	# ── Wiring ────────────────────────────────────────────────────────────
	generate_btn.click(
	fn = generate_tables,
	inputs = [model_selector, t2_model_a, t2_model_b, group_input],
	outputs = [
	status_box,
	t1_df, t2_df, t3_df, t4_df, t5_df, t6_df,
	latex_box, md_box,
	dl_t1, dl_t2, dl_t3, dl_t4, dl_t5, dl_t6,
	dl_latex, dl_md, dl_zip,
	],
	)

	refresh_btn.click(
	fn = _refresh_choices,
	inputs = [],
	outputs = [model_selector, t2_model_a, t2_model_b],
	)