Spaces:

ENC-PSL
/

lrec2026-llm-annotator

Running

App Files Files Community

add_support_ilaas_llm_provider

by lterriel - opened 3 days ago

base: refs/heads/main

←

from: refs/pr/2

Discussion Files changed

+2426

-1844

Files changed (6) hide show

.gitignore +5 -0
app.py +172 -83
prompts.py +25 -1
provider.py +82 -29
static/app.js +1206 -933
static/index.html +0 -0

.gitignore ADDED Viewed

	@@ -0,0 +1,5 @@

+.idea/
+__pycache__/
+*.pyc
+.DS_Store
+DS_Store

app.py CHANGED Viewed

@@ -5,6 +5,7 @@ file exposes a small REST API and a tiny in-memory session store. State is
 ephemeral and per-process; perfect for a single-user demo or HF Space.
 """
 from __future__ import annotations
 import asyncio
 import os
@@ -32,12 +33,14 @@ from io_utils import (
 )
 from moe import aggregate
 from provider import (
-    LLMClient, PROVIDERS, BASE_URLS,
-    CURATED_MODELS_BY_PROVIDER, test_connection_sync,
 )
 from tutorial import EXERCISES, prefill
 STATIC_DIR = APP_DIR / "static"
@@ -49,12 +52,17 @@ def _default_schema() -> AnnotationSchema:
     return from_preset("ud_upos_morph")
-ENV_API_KEY = os.environ.get("OPENROUTER_API_KEY", "")
-def _resolve_key(header_key: Optional[str]) -> str:
-    """Prefer the per-request header (client-side key), fall back to env (shared demo key)."""
-    return (header_key or "").strip() or ENV_API_KEY
 SESSION: dict[str, Any] = {
@@ -79,12 +87,12 @@ def _new_sentence(idx: int, surface_tokens: list[str], *, sentence_id: str = "",
         "id": sentence_id or f"s{idx + 1}",
         "language": language,
         "tokens": [{"surface": s} for s in surface_tokens],
-        "per_model": {},        # {model -> annotation dict}
-        "disagreements": [],    # list of dis dicts
-        "status": "pending",    # pending | annotating | done | error
         "error": "",
         "n_disagreements": 0,
-        "validated": False,     # True once the user confirms this sentence as gold
     }
@@ -100,7 +108,7 @@ def _public_state() -> dict:
         "language": sess["language"],
         "system_prompt": sess["system_prompt"],
         "user_template": sess["user_template"],
-        "has_env_key": bool(ENV_API_KEY),
         "models": sess["models"],
         "priority": sess["priority"],
         "temperature": sess["temperature"],
@@ -149,7 +157,7 @@ class LoadPasteReq(BaseModel):
     text: str
     tokenizer: str = "whitespace"  # whitespace | newline | as_is
     language: str = ""
-    split_per_line: bool = True    # True -> one sentence per non-empty line
 class LoadExerciseReq(BaseModel):
@@ -289,6 +297,12 @@ def load_paste(req: LoadPasteReq):
     return _public_state()
 @app.post("/api/corpus/exercise")
 def load_exercise(req: LoadExerciseReq):
     if req.idx < 0 or req.idx >= len(EXERCISES):
@@ -299,7 +313,11 @@ def load_exercise(req: LoadExerciseReq):
     SESSION["language"] = data["language_name"]
     SESSION["user_template"] = data["user_template"]
     SESSION["system_prompt"] = data["system_prompt"]
-    SESSION["models"] = list(data["models"])
     # Seed ICL pool with the example's pre-validated sandbox sentences
     pool = ICLPool()
     for ex in data["icl_examples"]:
@@ -332,7 +350,7 @@ def reset_all():
     SESSION["schema"] = _default_schema().to_dict()
     SESSION["language"] = ""
     SESSION["provider"] = "openrouter"
-    SESSION["models"] = list(CURATED_MODELS_BY_PROVIDER["openrouter"][:1])
     SESSION["priority"] = []
     SESSION["temperature"] = 0.0
     SESSION["n_icl"] = 5
@@ -345,22 +363,68 @@ def reset_all():
 # --- token edit ------------------------------------------------------------
 @app.post("/api/sentence/{idx}/token/{tidx}")
 def update_token(idx: int, tidx: int, req: TokenUpdateReq):
     sents = SESSION["sentences"]
     if idx < 0 or idx >= len(sents):
         raise HTTPException(404, "Bad sentence idx")
     if tidx < 0 or tidx >= len(sents[idx]["tokens"]):
         raise HTTPException(404, "Bad token idx")
-    # Preserve surface (never editable)
-    surface = sents[idx]["tokens"][tidx]["surface"]
     new_tok = {**req.token, "surface": surface}
-    sents[idx]["tokens"][tidx] = new_tok
-    # Remove this token from disagreement list if it was there
-    sents[idx]["disagreements"] = [d for d in sents[idx]["disagreements"] if d["token_idx"] != tidx]
-    sents[idx]["n_disagreements"] = len(sents[idx]["disagreements"])
-    return sents[idx]
 @app.post("/api/bulk_similar")
@@ -372,7 +436,11 @@ def bulk_similar(payload: dict):
         "updates": {"pos": "DET", "lemma": "ὁ"},
         "exclude": [{"s": sidx, "t": tidx}, ...]   # optional, e.g. the source token
     }
-    Returns: {"affected": [{"s": sidx, "t": tidx}, ...], "state": <_public_state>}
     """
     surface = payload.get("surface")
     updates = payload.get("updates") or {}
@@ -398,7 +466,13 @@ def bulk_similar(payload: dict):
             ]
             sent["n_disagreements"] = len(sent["disagreements"])
             affected.append({"s": sidx, "t": tidx})
-    return {"affected": affected, "state": _public_state()}
 @app.post("/api/sentence/{idx}/bulk")
@@ -415,39 +489,26 @@ def bulk_update(idx: int, payload: dict):
     for ti in idxs:
         if 0 <= ti < len(sents[idx]["tokens"]):
             sents[idx]["tokens"][ti][field] = value
-            sents[idx]["disagreements"] = [d for d in sents[idx]["disagreements"] if not (d["token_idx"] == ti and d["field_path"] == field)]
     sents[idx]["n_disagreements"] = len(sents[idx]["disagreements"])
     return sents[idx]
 # --- ICL pool --------------------------------------------------------------
 @app.post("/api/sentence/{idx}/add_to_icl")
 def add_sentence_to_icl(idx: int):
-    sents = SESSION["sentences"]
-    if idx < 0 or idx >= len(sents):
-        raise HTTPException(404, "Bad sentence idx")
-    sent = sents[idx]
-    schema_obj = schema_from_dict(SESSION["schema"])
-    pool: ICLPool = SESSION["icl_pool"]
-    ann = {
-        "sentence_id": sent["id"],
-        "language": sent["language"] or SESSION["language"],
-        "tokens": sent["tokens"],
-    }
-    pool.add(ICLExample(
-        language=sent["language"] or SESSION["language"] or "",
-        schema_hash=schema_obj.hash(),
-        tokens=[t["surface"] for t in sent["tokens"]],
-        gold_annotation=ann,
-        source="corrected",
-    ))
-    # Adding to ICL implies the user accepts this annotation as gold → mark validated.
-    sent["validated"] = True
-    return _public_state()
-@app.post("/api/sentence/{idx}/validate")
 def set_validated(idx: int, payload: dict):
     """payload = {value: bool}. Toggles the user-validation flag on a sentence."""
     sents = SESSION["sentences"]
@@ -472,10 +533,10 @@ def icl_download():
 # --- annotation ------------------------------------------------------------
 async def _annotate_sentence(sent: dict, client: LLMClient,
-                              schema: AnnotationSchema, sys_prompt: str,
-                              user_template: str, language: str,
-                              pool: ICLPool, n_icl: int, temperature: float,
-                              priority: list[str], models: list[str]) -> dict:
     tokens = [t["surface"] for t in sent["tokens"]]
     examples = pool.sample(
         n=int(n_icl), schema_hash=schema.hash(),
@@ -533,59 +594,74 @@ async def _annotate_sentence(sent: dict, client: LLMClient,
 @app.post("/api/annotate")
 async def annotate(
-    req: AnnotateReq,
-    x_api_key: Optional[str] = Header(default=None),
-    x_openrouter_key: Optional[str] = Header(default=None),  # back-compat
-    x_llm_provider: Optional[str] = Header(default=None),
 ):
     sess = SESSION
     provider = (x_llm_provider or sess["provider"]).strip()
     if provider not in PROVIDERS:
         raise HTTPException(400, f"Unknown provider {provider!r}")
-    api_key = _resolve_key(x_api_key or x_openrouter_key)
     if not api_key:
         raise HTTPException(400, f"Set your {provider} API key first.")
     if not sess["models"]:
         raise HTTPException(400, "Select at least one model.")
     if provider != "openrouter" and len(sess["models"]) > 1:
-        raise HTTPException(400, f"MoE (multiple models) is only supported on OpenRouter. Pick one model for {provider}.")
     schema_obj = schema_from_dict(sess["schema"])
-    client = LLMClient(provider=provider, api_key=api_key)
-    pool: ICLPool = sess["icl_pool"]
-    sents = sess["sentences"]
-    target_idxs = req.sentence_idxs if req.sentence_idxs is not None else list(range(len(sents)))
-    coros = []
-    for i in target_idxs:
-        if 0 <= i < len(sents):
-            sents[i]["status"] = "annotating"
-            coros.append(_annotate_sentence(
-                sents[i], client, schema_obj, sess["system_prompt"], sess["user_template"],
-                sess["language"], pool, sess["n_icl"], sess["temperature"],
-                sess["priority"], sess["models"],
-            ))
-    await asyncio.gather(*coros)
     return _public_state()
 @app.post("/api/annotate/token")
 async def annotate_one_token(
-    payload: dict,
-    x_api_key: Optional[str] = Header(default=None),
-    x_openrouter_key: Optional[str] = Header(default=None),
-    x_llm_provider: Optional[str] = Header(default=None),
 ):
     """Re-ask a specific model for a specific token. payload = {sent: int, tok: int, model: str}"""
     sess = SESSION
     provider = (x_llm_provider or sess["provider"]).strip()
     if provider not in PROVIDERS:
         raise HTTPException(400, f"Unknown provider {provider!r}")
-    api_key = _resolve_key(x_api_key or x_openrouter_key)
     if not api_key:
         raise HTTPException(400, f"Set your {provider} API key first.")
     idx = int(payload["sent"])
     tidx = int(payload["tok"])
     model = str(payload["model"])
     sent = sess["sentences"][idx]
     schema = schema_from_dict(sess["schema"])
     tokens = [t["surface"] for t in sent["tokens"]]
     pool: ICLPool = sess["icl_pool"]
@@ -595,13 +671,26 @@ async def annotate_one_token(
         language=sess["language"] or sent["language"], sentence_id=sent["id"],
         few_shot_examples=examples,
     ) + f"\n\nFocus especially on token index {tidx} (surface={tokens[tidx]!r}). Return JSON for all tokens; preserve the order."
-    client = LLMClient(provider=provider, api_key=api_key)
-    result = await client.annotate_one(
-        system=sess["system_prompt"], user=rendered_user,
-        schema=schema, model=model, temperature=float(sess["temperature"]),
-    )
     if not result.ok or not result.annotation:
         raise HTTPException(502, f"{model} failed: {result.error}")
     # update only the targeted token
     new_tok = result.annotation["tokens"][tidx]
     new_tok["surface"] = tokens[tidx]
@@ -668,7 +757,7 @@ def validate_sentence(idx: int):
 app.mount("/static", StaticFiles(directory=str(STATIC_DIR)), name="static")
 if __name__ == "__main__":
     import uvicorn
     uvicorn.run("app:app", host="0.0.0.0", port=7860, reload=False)

 ephemeral and per-process; perfect for a single-user demo or HF Space.
 """
 from __future__ import annotations
+from copy import deepcopy
 import asyncio
 import os
 )
 from moe import aggregate
 from provider import (
+    LLMClient,
+    PROVIDERS,
+    BASE_URLS,
+    CURATED_MODELS_BY_PROVIDER,
+    test_connection_sync
 )
 from tutorial import EXERCISES, prefill
 STATIC_DIR = APP_DIR / "static"
     return from_preset("ud_upos_morph")
+ENV_API_KEYS = {
+    "openrouter": os.environ.get("OPENROUTER_API_KEY", ""),
+    "mistral": os.environ.get("MISTRAL_API_KEY", ""),
+    "openai": os.environ.get("OPENAI_API_KEY", ""),
+    "ilaas": os.environ.get("ILAAS_API_KEY", ""),
+}
+def _resolve_key(provider: str, header_key: Optional[str]) -> str:
+    """Prefer the per-request header, fall back to provider-specific env key."""
+    return (header_key or "").strip() or ENV_API_KEYS.get(provider, "")
 SESSION: dict[str, Any] = {
         "id": sentence_id or f"s{idx + 1}",
         "language": language,
         "tokens": [{"surface": s} for s in surface_tokens],
+        "per_model": {},  # {model -> annotation dict}
+        "disagreements": [],  # list of dis dicts
+        "status": "pending",  # pending | annotating | done | error
         "error": "",
         "n_disagreements": 0,
+        "validated": False,  # True once the user confirms this sentence as gold
     }
         "language": sess["language"],
         "system_prompt": sess["system_prompt"],
         "user_template": sess["user_template"],
+        "has_env_key": bool(ENV_API_KEYS.get(sess["provider"], "")),
         "models": sess["models"],
         "priority": sess["priority"],
         "temperature": sess["temperature"],
     text: str
     tokenizer: str = "whitespace"  # whitespace | newline | as_is
     language: str = ""
+    split_per_line: bool = True  # True -> one sentence per non-empty line
 class LoadExerciseReq(BaseModel):
     return _public_state()
+def _default_models_for_provider(provider: str) -> list[str]:
+    """Helper to get the default model(s) for a provider, used when switching providers."""
+    curated = CURATED_MODELS_BY_PROVIDER.get(provider) or []
+    return list(curated[:1])
 @app.post("/api/corpus/exercise")
 def load_exercise(req: LoadExerciseReq):
     if req.idx < 0 or req.idx >= len(EXERCISES):
     SESSION["language"] = data["language_name"]
     SESSION["user_template"] = data["user_template"]
     SESSION["system_prompt"] = data["system_prompt"]
+    # Exercise presets may contain OpenRouter slugs. Keep them only when using OpenRouter.
+    if SESSION["provider"] == "openrouter":
+        SESSION["models"] = list(data["models"])
+    else:
+        SESSION["models"] = _default_models_for_provider(SESSION["provider"])
     # Seed ICL pool with the example's pre-validated sandbox sentences
     pool = ICLPool()
     for ex in data["icl_examples"]:
     SESSION["schema"] = _default_schema().to_dict()
     SESSION["language"] = ""
     SESSION["provider"] = "openrouter"
+    SESSION["models"] = _default_models_for_provider("openrouter")
     SESSION["priority"] = []
     SESSION["temperature"] = 0.0
     SESSION["n_icl"] = 5
 # --- token edit ------------------------------------------------------------
+def _add_or_update_sentence_in_icl(idx: int) -> str:
+    sents = SESSION["sentences"]
+    if idx < 0 or idx >= len(sents):
+        raise HTTPException(404, "Bad sentence idx")
+    sent = sents[idx]
+    schema_obj = schema_from_dict(SESSION["schema"])
+    pool: ICLPool = SESSION["icl_pool"]
+    tokens_snapshot = deepcopy(sent["tokens"])
+    ann = {
+        "sentence_id": sent["id"],
+        "language": sent["language"] or SESSION["language"],
+        "tokens": tokens_snapshot,
+    }
+    result = pool.add(ICLExample(
+        language=sent["language"] or SESSION["language"] or "",
+        schema_hash=schema_obj.hash(),
+        tokens=[t["surface"] for t in tokens_snapshot],
+        gold_annotation=ann,
+        source="corrected",
+    ))
+    sent["validated"] = True
+    return result
 @app.post("/api/sentence/{idx}/token/{tidx}")
 def update_token(idx: int, tidx: int, req: TokenUpdateReq):
     sents = SESSION["sentences"]
     if idx < 0 or idx >= len(sents):
         raise HTTPException(404, "Bad sentence idx")
     if tidx < 0 or tidx >= len(sents[idx]["tokens"]):
         raise HTTPException(404, "Bad token idx")
+    sent = sents[idx]
+    was_validated = bool(sent.get("validated"))
+    surface = sent["tokens"][tidx]["surface"]
     new_tok = {**req.token, "surface": surface}
+    sent["tokens"][tidx] = new_tok
+    sent["disagreements"] = [
+        d for d in sent["disagreements"]
+        if d["token_idx"] != tidx
+    ]
+    sent["n_disagreements"] = len(sent["disagreements"])
+    icl_result = None
+    # Editing a token of an already-validated sentence re-submits it to the ICL pool (updating the existing entry, or inserting it if missing) so the pool stays in sync with user corrections.
+    if was_validated:
+        icl_result = _add_or_update_sentence_in_icl(idx)
+    state = _public_state()
+    state["updated_sentence_idx"] = idx
+    state["icl_add_result"] = icl_result
+    state["icl_duplicate"] = icl_result == "unchanged"
+    state["icl_updated"] = icl_result == "updated"
+    state["icl_inserted"] = icl_result == "inserted"
+    return state
 @app.post("/api/bulk_similar")
         "updates": {"pos": "DET", "lemma": "ὁ"},
         "exclude": [{"s": sidx, "t": tidx}, ...]   # optional, e.g. the source token
     }
+    Returns:
+        {
+            "affected": [{"s": sidx, "t": tidx}, ...],
+            "sentences": [{"idx": sidx, "sentence": {...}}, ...]
+        }
     """
     surface = payload.get("surface")
     updates = payload.get("updates") or {}
             ]
             sent["n_disagreements"] = len(sent["disagreements"])
             affected.append({"s": sidx, "t": tidx})
+    return {
+        "affected": affected,
+        "sentences": [
+            {"idx": i, "sentence": SESSION["sentences"][i]}
+            for i in sorted({a["s"] for a in affected})
+        ],
+    }
 @app.post("/api/sentence/{idx}/bulk")
     for ti in idxs:
         if 0 <= ti < len(sents[idx]["tokens"]):
             sents[idx]["tokens"][ti][field] = value
+            sents[idx]["disagreements"] = [d for d in sents[idx]["disagreements"] if
+                                           not (d["token_idx"] == ti and d["field_path"] == field)]
     sents[idx]["n_disagreements"] = len(sents[idx]["disagreements"])
     return sents[idx]
 # --- ICL pool --------------------------------------------------------------
 @app.post("/api/sentence/{idx}/add_to_icl")
 def add_sentence_to_icl(idx: int):
+    result = _add_or_update_sentence_in_icl(idx)
+    state = _public_state()
+    state["icl_add_result"] = result
+    state["icl_duplicate"] = result == "unchanged"
+    state["icl_updated"] = result == "updated"
+    state["icl_inserted"] = result == "inserted"
+    return state
+@app.post("/api/sentence/{idx}/sent_score")
 def set_validated(idx: int, payload: dict):
     """payload = {value: bool}. Toggles the user-validation flag on a sentence."""
     sents = SESSION["sentences"]
 # --- annotation ------------------------------------------------------------
 async def _annotate_sentence(sent: dict, client: LLMClient,
+                             schema: AnnotationSchema, sys_prompt: str,
+                             user_template: str, language: str,
+                             pool: ICLPool, n_icl: int, temperature: float,
+                             priority: list[str], models: list[str]) -> dict:
     tokens = [t["surface"] for t in sent["tokens"]]
     examples = pool.sample(
         n=int(n_icl), schema_hash=schema.hash(),
 @app.post("/api/annotate")
 async def annotate(
+        req: AnnotateReq,
+        x_api_key: Optional[str] = Header(default=None),
+        x_openrouter_key: Optional[str] = Header(default=None),  # back-compat
+        x_llm_provider: Optional[str] = Header(default=None),
 ):
     sess = SESSION
     provider = (x_llm_provider or sess["provider"]).strip()
     if provider not in PROVIDERS:
         raise HTTPException(400, f"Unknown provider {provider!r}")
+    api_key = _resolve_key(provider, x_api_key or x_openrouter_key)
     if not api_key:
         raise HTTPException(400, f"Set your {provider} API key first.")
     if not sess["models"]:
         raise HTTPException(400, "Select at least one model.")
     if provider != "openrouter" and len(sess["models"]) > 1:
+        raise HTTPException(400,
+                            f"MoE (multiple models) is only supported on OpenRouter. Pick one model for {provider}.")
     schema_obj = schema_from_dict(sess["schema"])
+    if provider != "openrouter":
+        allowed = set(CURATED_MODELS_BY_PROVIDER.get(provider) or [])
+        unknown = [m for m in sess["models"] if m not in allowed]
+        if unknown:
+            raise HTTPException(
+                400,
+                f"Model(s) not available for provider {provider}: {unknown}. "
+                f"Pick one of: {sorted(allowed)}"
+            )
+    async with LLMClient(provider=provider, api_key=api_key) as client:
+        pool: ICLPool = sess["icl_pool"]
+        sents = sess["sentences"]
+        target_idxs = req.sentence_idxs if req.sentence_idxs is not None else list(range(len(sents)))
+        coros = []
+        for i in target_idxs:
+            if 0 <= i < len(sents):
+                sents[i]["status"] = "annotating"
+                coros.append(_annotate_sentence(
+                    sents[i], client, schema_obj, sess["system_prompt"], sess["user_template"],
+                    sess["language"], pool, sess["n_icl"], sess["temperature"],
+                    sess["priority"], sess["models"],
+                ))
+        await asyncio.gather(*coros)
     return _public_state()
 @app.post("/api/annotate/token")
 async def annotate_one_token(
+        payload: dict,
+        x_api_key: Optional[str] = Header(default=None),
+        x_openrouter_key: Optional[str] = Header(default=None),
+        x_llm_provider: Optional[str] = Header(default=None),
 ):
     """Re-ask a specific model for a specific token. payload = {sent: int, tok: int, model: str}"""
     sess = SESSION
     provider = (x_llm_provider or sess["provider"]).strip()
     if provider not in PROVIDERS:
         raise HTTPException(400, f"Unknown provider {provider!r}")
+    api_key = _resolve_key(provider, x_api_key or x_openrouter_key)
     if not api_key:
         raise HTTPException(400, f"Set your {provider} API key first.")
     idx = int(payload["sent"])
     tidx = int(payload["tok"])
     model = str(payload["model"])
+    if idx < 0 or idx >= len(sess["sentences"]):
+        raise HTTPException(404, "Bad sentence idx")
     sent = sess["sentences"][idx]
+    if tidx < 0 or tidx >= len(sent["tokens"]):
+        raise HTTPException(404, "Bad token idx")
     schema = schema_from_dict(sess["schema"])
     tokens = [t["surface"] for t in sent["tokens"]]
     pool: ICLPool = sess["icl_pool"]
         language=sess["language"] or sent["language"], sentence_id=sent["id"],
         few_shot_examples=examples,
     ) + f"\n\nFocus especially on token index {tidx} (surface={tokens[tidx]!r}). Return JSON for all tokens; preserve the order."
+    if provider != "openrouter":
+        allowed = set(CURATED_MODELS_BY_PROVIDER.get(provider) or [])
+        if model not in allowed:
+            raise HTTPException(
+                400,
+                f"Model {model!r} is not available for provider {provider}. "
+                f"Pick one of: {sorted(allowed)}"
+            )
+    async with LLMClient(provider=provider, api_key=api_key) as client:
+        result = await client.annotate_one(
+            system=sess["system_prompt"],
+            user=rendered_user,
+            schema=schema,
+            model=model,
+            temperature=float(sess["temperature"]),
+        )
     if not result.ok or not result.annotation:
         raise HTTPException(502, f"{model} failed: {result.error}")
+    if tidx >= len(result.annotation.get("tokens", [])):
+        raise HTTPException(502, f"{model} returned too few tokens.")
     # update only the targeted token
     new_tok = result.annotation["tokens"][tidx]
     new_tok["surface"] = tokens[tidx]
 app.mount("/static", StaticFiles(directory=str(STATIC_DIR)), name="static")
 if __name__ == "__main__":
     import uvicorn
     uvicorn.run("app:app", host="0.0.0.0", port=7860, reload=False)

prompts.py CHANGED Viewed

@@ -5,6 +5,7 @@ written material. ICLPool keeps a session-scoped, filterable bank of validated
 or corrected examples.
 """
 from __future__ import annotations
 import json
 import random
@@ -30,6 +31,8 @@ class ICLExample:
     note: str = ""
 @dataclass
 class ICLPool:
     """Session-scoped pool of in-context examples.
@@ -40,9 +43,30 @@ class ICLPool:
     entries: list[ICLExample] = field(default_factory=list)
     version: int = 0
-    def add(self, ex: ICLExample) -> None:
         self.entries.append(ex)
         self.version += 1
     def filter(self, language: str = "", schema_hash: str = "") -> list[ICLExample]:
         out = self.entries

 or corrected examples.
 """
 from __future__ import annotations
+from copy import deepcopy
 import json
 import random
     note: str = ""
 @dataclass
 class ICLPool:
     """Session-scoped pool of in-context examples.
     entries: list[ICLExample] = field(default_factory=list)
     version: int = 0
+    def _key(self, ex: ICLExample) -> tuple[str, str, tuple[str, ...]]:
+        return (
+            ex.language or "",
+            ex.schema_hash or "",
+            tuple(ex.tokens or []),
+        )
+    def _same_content(self, a: ICLExample, b: ICLExample) -> bool:
+        return a.gold_annotation == b.gold_annotation
+    def add(self, ex: ICLExample) -> str:
+        ex = deepcopy(ex)
+        key = self._key(ex)
+        for i, existing in enumerate(self.entries):
+            if self._key(existing) == key:
+                if self._same_content(existing, ex):
+                    return "unchanged"
+                self.entries[i] = ex
+                self.version += 1
+                return "updated"
         self.entries.append(ex)
         self.version += 1
+        return "inserted"
     def filter(self, language: str = "", schema_hash: str = "") -> list[ICLExample]:
         out = self.entries

provider.py CHANGED Viewed

@@ -4,6 +4,7 @@ Supports three OpenAI-compatible providers via parametric base URL:
 - openrouter : https://openrouter.ai/api/v1   (MoE: many models behind one key)
 - mistral    : https://api.mistral.ai/v1
 - openai     : https://api.openai.com/v1
 All three accept the same OpenAI Chat Completions request shape, including
 `response_format` (json_schema strict on OpenAI; json_object on Mistral; varies
@@ -24,14 +25,16 @@ from prompts import VALIDATION_RETRY
 DEFAULT_TIMEOUT = 60.0
-PROVIDERS = ("openrouter", "mistral", "openai")
 BASE_URLS = {
     "openrouter": "https://openrouter.ai/api/v1",
-    "mistral":    "https://api.mistral.ai/v1",
-    "openai":     "https://api.openai.com/v1",
 }
 CURATED_MODELS_BY_PROVIDER: dict[str, list[str]] = {
     "openrouter": [
         "openai/gpt-oss-20b:free",
@@ -55,6 +58,14 @@ CURATED_MODELS_BY_PROVIDER: dict[str, list[str]] = {
         "gpt-5-2025-08-07",
         "gpt-4o-mini-2024-07-18",
     ],
 }
 # Back-compat alias used by other modules
@@ -81,33 +92,55 @@ def _build_headers(provider: str, api_key: str) -> dict:
         h["X-Title"] = "LREC2026 LLM-as-Annotator"
     return h
 class LLMClient:
-    def __init__(self, provider: str, api_key: str):
         if provider not in BASE_URLS:
-            raise ValueError(f"Unknown provider {provider!r}; expected one of {PROVIDERS}")
         self.provider = provider
         self.api_key = api_key
         self.base_url = BASE_URLS[provider]
         self.endpoint = self.base_url + "/chat/completions"
         self.headers = _build_headers(provider, api_key)
     async def annotate_one(
-        self,
-        *,
-        system: str,
-        user: str,
-        schema: AnnotationSchema,
-        model: str,
-        temperature: float = 0.0,
-        timeout: float = DEFAULT_TIMEOUT,
     ) -> ModelResult:
         """Call one model, validate JSON. One retry on schema-validation failure."""
         json_schema = to_json_schema(schema)
         start = time.time()
         msgs = [{"role": "system", "content": system}, {"role": "user", "content": user}]
         try:
-            async with httpx.AsyncClient(timeout=timeout) as client:
                 raw_text = await self._call(client, msgs, json_schema, model, temperature)
                 ann, err = self._parse_and_validate(raw_text, schema)
                 if err:
@@ -117,20 +150,28 @@ class LLMClient:
                     raw_text = await self._call(client, msgs, json_schema, model, temperature)
                     ann, err = self._parse_and_validate(raw_text, schema)
                 if err:
-                    return ModelResult(model=model, ok=False, annotation=None, latency_s=time.time() - start, error=err, raw=raw_text)
                 return ModelResult(model=model, ok=True, annotation=ann, latency_s=time.time() - start, raw=raw_text)
         except Exception as e:
             return ModelResult(model=model, ok=False, annotation=None, latency_s=time.time() - start, error=str(e))
     async def annotate_many(
-        self,
-        *,
-        models: list[str],
-        system: str,
-        user: str,
-        schema: AnnotationSchema,
-        temperature: float = 0.0,
-        timeout: float = DEFAULT_TIMEOUT,
     ) -> list[ModelResult]:
         coros = [
             self.annotate_one(
@@ -140,26 +181,38 @@ class LLMClient:
         ]
         return await asyncio.gather(*coros)
-    async def _call(self, client: httpx.AsyncClient, msgs: list[dict], json_schema: dict, model: str, temperature: float) -> str:
         # Strict json_schema works on OpenAI and most OpenRouter models. For Mistral and
         # for some open-source models routed via OpenRouter, fall back to json_object.
-        if self.provider == "mistral":
             payload = {
-                "model": model, "messages": msgs, "temperature": temperature,
                 "response_format": {"type": "json_object"},
             }
         else:
             payload = {
-                "model": model, "messages": msgs, "temperature": temperature,
                 "response_format": {
                     "type": "json_schema",
-                    "json_schema": {"name": "annotation", "strict": True, "schema": json_schema},
                 },
             }
         resp = await client.post(self.endpoint, headers=self.headers, json=payload)
         if resp.status_code >= 400:
             payload["response_format"] = {"type": "json_object"}
             resp = await client.post(self.endpoint, headers=self.headers, json=payload)
         resp.raise_for_status()
         data = resp.json()
         return data["choices"][0]["message"]["content"] or ""

 - openrouter : https://openrouter.ai/api/v1   (MoE: many models behind one key)
 - mistral    : https://api.mistral.ai/v1
 - openai     : https://api.openai.com/v1
+- ilaas      : https://llm.ilaas.fr/v1 (documentation: https://www.ilaas.fr/services-inference/)
 All four accept the same OpenAI Chat Completions request shape, including
 `response_format` (json_schema strict on OpenAI; json_object on Mistral; varies
 DEFAULT_TIMEOUT = 60.0
 BASE_URLS = {
     "openrouter": "https://openrouter.ai/api/v1",
+    "mistral": "https://api.mistral.ai/v1",
+    "openai": "https://api.openai.com/v1",
+    "ilaas": "https://llm.ilaas.fr/v1",
 }
+PROVIDERS = tuple(BASE_URLS.keys())
 CURATED_MODELS_BY_PROVIDER: dict[str, list[str]] = {
     "openrouter": [
         "openai/gpt-oss-20b:free",
         "gpt-5-2025-08-07",
         "gpt-4o-mini-2024-07-18",
     ],
+    "ilaas": [
+        "gemma-4-31b",
+        "gpt-oss-120b",
+        "llama-3.1-8b",
+        "llama-3.3-70b",
+        "qwen-3.6-35b-instruct",
+        "mistral-small-3.2-24b",
+    ]
 }
 # Back-compat alias used by other modules
         h["X-Title"] = "LREC2026 LLM-as-Annotator"
     return h
 class LLMClient:
+    def __init__(self, provider: str, api_key: str, timeout: float = DEFAULT_TIMEOUT):
         # Reject providers that have no entry in BASE_URLS before storing anything.
         if provider not in BASE_URLS:
+            raise ValueError(f"Unknown provider {provider!r}; expected one of {tuple(BASE_URLS)}")
         self.provider = provider
         self.api_key = api_key
         self.base_url = BASE_URLS[provider]
         # Every request goes to the provider's chat-completions route.
         self.endpoint = self.base_url + "/chat/completions"
         self.headers = _build_headers(provider, api_key)
+        self.timeout = timeout
         # Shared HTTP client; stays None until __aenter__ creates it.
+        self._client: httpx.AsyncClient | None = None
+    async def __aenter__(self):
         # Open one shared client (using self.timeout and bounded connection limits)
         # for the duration of the `async with` block, then hand back this LLMClient.
+        self._client = httpx.AsyncClient(
+            timeout=self.timeout,
+            limits=httpx.Limits(
+                max_connections=20,
+                max_keepalive_connections=10,
+            ),
+        )
+        return self
+    async def __aexit__(self, exc_type, exc, tb):
         # Close the shared client if one was opened and reset the attribute to None.
+        if self._client:
+            await self._client.aclose()
+            self._client = None
     async def annotate_one(
+            self,
+            *,
+            system: str,
+            user: str,
+            schema: AnnotationSchema,
+            model: str,
+            temperature: float = 0.0,
+            timeout: float = DEFAULT_TIMEOUT,
     ) -> ModelResult:
         """Call one model, validate JSON. One retry on schema-validation failure."""
+        print(f"[LLM] start provider={self.provider} model={model}")
         json_schema = to_json_schema(schema)
         start = time.time()
         msgs = [{"role": "system", "content": system}, {"role": "user", "content": user}]
         try:
+            client = self._client
+            close_after = False
+            if client is None:
+                client = httpx.AsyncClient(timeout=timeout)
+                close_after = True
+            try:
                 raw_text = await self._call(client, msgs, json_schema, model, temperature)
                 ann, err = self._parse_and_validate(raw_text, schema)
                 if err:
                     raw_text = await self._call(client, msgs, json_schema, model, temperature)
                     ann, err = self._parse_and_validate(raw_text, schema)
                 if err:
+                    print(
+                        f"[LLM] error provider={self.provider} model={model} latency={time.time() - start:.2f}s error={e}")
+                    return ModelResult(model=model, ok=False, annotation=None, latency_s=time.time() - start, error=err,
+                                       raw=raw_text)
+                print(f"[LLM] done provider={self.provider} model={model} latency={time.time() - start:.2f}s")
                 return ModelResult(model=model, ok=True, annotation=ann, latency_s=time.time() - start, raw=raw_text)
+            finally:
+                if close_after:
+                    await client.aclose()
         except Exception as e:
+            print(f"[LLM] error provider={self.provider} model={model} latency={time.time() - start:.2f}s error={e}")
             return ModelResult(model=model, ok=False, annotation=None, latency_s=time.time() - start, error=str(e))
     async def annotate_many(
+            self,
+            *,
+            models: list[str],
+            system: str,
+            user: str,
+            schema: AnnotationSchema,
+            temperature: float = 0.0,
+            timeout: float = DEFAULT_TIMEOUT,
     ) -> list[ModelResult]:
         coros = [
             self.annotate_one(
         ]
         return await asyncio.gather(*coros)
+    async def _call(self, client: httpx.AsyncClient, msgs: list[dict], json_schema: dict, model: str,
+                    temperature: float) -> str:
         # Strict json_schema works on OpenAI and most OpenRouter models. Mistral and
         # ILaaS are sent json_object directly. Any response with status >= 400 is
         # retried with json_object (this also covers open-source models routed via
         # OpenRouter), and if that still fails, once more with no response_format.
+        if self.provider in {"mistral", "ilaas"}:
             payload = {
+                "model": model,
+                "messages": msgs,
+                "temperature": temperature,
                 "response_format": {"type": "json_object"},
             }
         else:
             payload = {
+                "model": model,
+                "messages": msgs,
+                "temperature": temperature,
                 "response_format": {
                     "type": "json_schema",
+                    "json_schema": {
+                        "name": "annotation",
+                        "strict": True,
+                        "schema": json_schema,
+                    },
                 },
             }
         resp = await client.post(self.endpoint, headers=self.headers, json=payload)
         if resp.status_code >= 400:
             payload["response_format"] = {"type": "json_object"}
             resp = await client.post(self.endpoint, headers=self.headers, json=payload)
+        if resp.status_code >= 400:
+            payload.pop("response_format", None)
+            resp = await client.post(self.endpoint, headers=self.headers, json=payload)
         resp.raise_for_status()
         data = resp.json()
         return data["choices"][0]["message"]["content"] or ""

static/app.js CHANGED Viewed

@@ -1,948 +1,1221 @@
 // LREC 2026 — LLM Annotator front-end logic (Alpine.js)
 function annotator() {
-  return {
-    // ----------- state -----------
-    paperLink: 'https://aclanthology.org/2026.loreslm-1.28/',
-    loading: false,
-    progressText: 'Annotating…',
-    modal: null,
-    cheatsheetHtml: '',
-    toasts: [],
-    nextToastId: 1,
-    focus: { sent: null, tok: null },
-    selection: new Set(),
-    ctxMenu: { open: false, x: 0, y: 0, s: null, t: null },
-    guideDismissed: false,
-    moeBannerDismissed: false,
-    moeHintDismissed: false,
-    // Per-provider client-side keys; persisted in sessionStorage only
-    localKeys: { openrouter: '', mistral: '', openai: '' },
-    state: {
-      schema: null,
-      schema_hash: '',
-      json_schema: {},
-      language: '',
-      system_prompt: '',
-      user_template: '',
-      has_env_key: false,
-      provider: 'openrouter',
-      providers: ['openrouter', 'mistral', 'openai'],
-      curated_models_by_provider: {},
-      models: [],
-      priority: [],
-      temperature: 0,
-      n_icl: 5,
-      icl_pool: { version: 0, size: 0, entries: [] },
-      sentences: [],
-      presets: [],
-      curated_models: [],
-      aggregators: [],
-      exercises: [],
-    },
-    editor: {
-      sidx: null, tidx: null,
-      tok: null,
-      original: null,            // snapshot at modal-open, used to diff field changes
-      perModel: {},
-      disagreementCells: [],
-      search: {},
-      filtered: {},
-      autoAdvance: true,
-      propagateToSimilar: false,
-    },
-    taskEditor: { json: '' },
-    modelEditor: { custom: '', priority: '' },
-    keyEditor: { value: '', testing: false, result: '', ok: false },
-    pasteEditor: {
-      text: '',
-      tokenizer: 'whitespace',
-      language: '',
-      presetKey: 'ud_upos_morph',
-      customTaskName: 'My custom task',
-      customTagInput: '',
-      customTags: [],
-      includeNone: true,
-      includeConfidence: true,
-      includeComment: false,
-    },
-    advEditor: { system_prompt: '', user_template: '', n_icl: 5, temperature: 0 },
-    bulkEditor: { field: '', value: '' },
-    // ----------- derived -----------
-    get schema() { return this.state.schema; },
-    get schemaFields() {
-      const f = (this.state.schema && this.state.schema.fields) || [];
-      return f;
-    },
-    get totalTokens() {
-      return this.state.sentences.reduce((a, s) => a + s.tokens.length, 0);
-    },
-    get totalDisagreements() {
-      return this.state.sentences.reduce((a, s) => a + (s.n_disagreements || 0), 0);
-    },
-    // ----------- key helpers (per-provider) -----------
-    get localKey() { return this.localKeys[this.state.provider] || ''; },
-    setLocalKey(value) {
-      const p = this.state.provider;
-      this.localKeys = { ...this.localKeys, [p]: value };
-      try { sessionStorage.setItem('llm_keys', JSON.stringify(this.localKeys)); } catch (e) {}
-    },
-    get hasKey() {
-      // env key is OpenRouter-only on the server side
-      const envOk = this.state.provider === 'openrouter' && !!this.state.has_env_key;
-      return !!this.localKey || envOk;
-    },
-    get canRun() {
-      return this.hasKey && this.state.models.length > 0 && this.state.sentences.length > 0;
-    },
-    keyHeaders() {
-      const h = { 'X-LLM-Provider': this.state.provider };
-      if (this.localKey) h['X-API-Key'] = this.localKey;
-      return h;
-    },
-    // ----------- init -----------
-    async init() {
-      this.guideDismissed = localStorage.getItem('guideDismissed') === '1';
-      this.moeBannerDismissed = localStorage.getItem('moeBannerDismissed') === '1';
-      this.moeHintDismissed = localStorage.getItem('moeHintDismissed') === '1';
-      // Load per-provider keys; migrate legacy single-key key if present
-      try {
-        const raw = sessionStorage.getItem('llm_keys');
-        if (raw) this.localKeys = { openrouter: '', mistral: '', openai: '', ...JSON.parse(raw) };
-        const legacy = sessionStorage.getItem('openrouter_key');
-        if (legacy && !this.localKeys.openrouter) {
-          this.localKeys = { ...this.localKeys, openrouter: legacy };
-          sessionStorage.setItem('llm_keys', JSON.stringify(this.localKeys));
-          sessionStorage.removeItem('openrouter_key');
-        }
-      } catch (e) {}
-      await this.refresh();
-      try {
-        const r = await fetch('/api/cheatsheet');
-        const txt = await r.text();
-        this.cheatsheetHtml = this.markdownToHtml(txt);
-      } catch (e) {}
-      // sync editor mirrors
-      this.taskEditor.json = JSON.stringify(this.state.schema, null, 2);
-      this.modelEditor.priority = this.state.priority.join(', ');
-      this.advEditor.system_prompt = this.state.system_prompt;
-      this.advEditor.user_template = this.state.user_template;
-      this.advEditor.n_icl = this.state.n_icl;
-      this.advEditor.temperature = this.state.temperature;
-      window.addEventListener('keydown', (e) => this.globalKey(e));
-      // persist dismissals
-      this.$watch?.('moeBannerDismissed', v => localStorage.setItem('moeBannerDismissed', v ? '1' : '0'));
-      this.$watch?.('moeHintDismissed', v => localStorage.setItem('moeHintDismissed', v ? '1' : '0'));
-    },
-    // ----------- contextual guide -----------
-    get guide() {
-      const s = this.state;
-      if (s.sentences.length === 0) {
-        return {
-          step: 1, icon: '📜', title: 'Load a corpus to start',
-          body: 'Pick a sandbox example in the left sidebar — Greek, Armenian or Syriac. They come with a task preset, a validated tagset, and 3–5 pre-loaded ICL examples (visible in the toolbar: <strong>ICL pool · v3 · 5 ex</strong>).',
-          actions: [
-            { label: '📘 Try Armenian (HYE)', handler: 'loadExercise', arg: 1 },
-            { label: 'Paste my own text', handler: 'modal', arg: 'paste' },
-          ],
-        };
-      }
-      if (!this.hasKey) {
-        return {
-          step: 2, icon: '🔑', title: 'Add your OpenRouter API key',
-          body: 'One key gives you access to Claude, GPT, Mistral, Llama, Qwen, DeepSeek and more. The key is kept <strong>in this browser tab only</strong> (sessionStorage) and never sent to or stored on the server — you can wipe it with the <strong>Clear key</strong> button at any time.',
-          actions: [
-            { label: 'Add API key', handler: 'modal', arg: 'key' },
-            { label: 'Get a key →', handler: 'openExternal', arg: 'https://openrouter.ai/keys' },
-          ],
-        };
-      }
-      const anyDone = s.sentences.some(x => x.status === 'done');
-      const anyPending = s.sentences.some(x => x.status === 'pending');
-      const totalDis = this.totalDisagreements;
-      const lastWasMoE = s.sentences.some(x => Object.keys(x.per_model || {}).length >= 2);
-      if (!anyDone) {
-        const moeNote = s.models.length >= 2
-          ? `<strong>MoE is ON</strong> — your ${s.models.length} models will be called in parallel and their answers voted token-by-token.`
-          : `Single model mode. To enable <strong>Mixture-of-Experts</strong> (parallel models + per-token vote), add a 2nd model.`;
-        return {
-          step: 3, icon: '▶️', title: 'Run the first annotation',
-          body: `Click <strong>Annotate all</strong> in the toolbar. The ${s.icl_pool.size} ICL examples already in the pool will be sent as few-shot context. ${moeNote}`,
-          actions: [
-            { label: '▶ Annotate all', handler: 'annotateAll' },
-            { label: 'Add a 2nd model (MoE)', handler: 'modal', arg: 'models', show: s.models.length < 2 },
-          ].filter(a => a.show !== false),
-        };
-      }
-      if (totalDis > 0) {
-        const moeMsg = lastWasMoE
-          ? `Each ⚠ amber token has at least one field where your models disagreed. Click it to see <em>which model said what</em> and pick the right answer (or click <kbd>adopt</kbd> next to one model).`
-          : `Click a token to edit it: change its tag, lemma, or any field. With keyboard: <kbd>e</kbd> to edit, <kbd>↵</kbd> to save & auto-advance to the next ⚠.`;
-        return {
-          step: 4, icon: '⚠', title: `Review ${totalDis} disagreement${totalDis !== 1 ? 's' : ''}`,
-          body: moeMsg,
-          actions: [
-            { label: 'Open first ⚠', handler: 'jumpToFirstDisagreement' },
-          ],
-        };
-      }
-      if (s.icl_pool.entries.filter(e => e.source === 'corrected').length === 0 && anyDone) {
-        return {
-          step: 5, icon: '📥', title: 'Feed corrections back to ICL',
-          body: 'Your sentences look consensual. To bootstrap: click <strong>📥 to ICL</strong> on any sentence to add its (corrected) annotation to the few-shot pool. Subsequent runs will reuse it. <strong>This is how the loop closes.</strong> Then export, or load more sentences.',
-          actions: [
-            { label: '⬇ Export the corpus', handler: 'modal', arg: 'exports' },
-          ],
-        };
-      }
-      return {
-        step: 5, icon: '✅', title: 'Loop closed — export or continue',
-        body: `Your ICL pool now has <strong>${s.icl_pool.size}</strong> entries (version <strong>v${s.icl_pool.version}</strong>). Re-run on more sentences and they will benefit from your corrections. Or export the corpus in TSV / JSON / CoNLL-U / JSONL.`,
-        actions: [
-          { label: '⬇ Export', handler: 'modal', arg: 'exports' },
-          { label: 'Paste more text', handler: 'modal', arg: 'paste' },
-        ],
-      };
-    },
-    runGuideAction(a) {
-      if (a.handler === 'modal') { this.modal = a.arg; return; }
-      if (a.handler === 'loadExercise') { this.loadExercise(a.arg); return; }
-      if (a.handler === 'annotateAll') { this.annotateAll(); return; }
-      if (a.handler === 'openExternal') { window.open(a.arg, '_blank'); return; }
-      if (a.handler === 'jumpToFirstDisagreement') {
-        for (let i = 0; i < this.state.sentences.length; i++) {
-          const ds = this.state.sentences[i].disagreements || [];
-          if (ds.length > 0) {
-            const t = ds.sort((x, y) => x.token_idx - y.token_idx)[0].token_idx;
-            this.openTokenEditor(i, t);
-            return;
-          }
-        }
-      }
-    },
-    allDisplayableModels() {
-      const set = new Set(this.state.curated_models);
-      for (const m of this.state.models) set.add(m);
-      return Array.from(set);
-    },
-    tokenTooltip(sent, tidx) {
-      const tok = sent.tokens[tidx];
-      const lines = [`${tok.surface}`];
-      for (const f of (this.state.schema?.fields || [])) {
-        const v = tok[f.name];
-        if (v && typeof v !== 'object') lines.push(`${f.name}: ${v}`);
-      }
-      const dis = (sent.disagreements || []).filter(d => d.token_idx === tidx);
-      if (dis.length > 0 && Object.keys(sent.per_model || {}).length > 0) {
-        lines.push('');
-        lines.push('Per-model votes:');
-        for (const [m, ann] of Object.entries(sent.per_model)) {
-          const t = (ann.tokens || [])[tidx] || {};
-          const enums = (this.state.schema?.fields || []).filter(f => f.type === 'enum' && f.name !== 'confidence');
-          const tag = enums[0] ? (t[enums[0].name] ?? '∅') : '';
-          const lemma = t.lemma ? ` ${t.lemma}` : '';
-          lines.push(`  • ${this.modelShort(m)}: ${tag}${lemma}`);
-        }
-      } else if (tok._corrected) {
-        lines.push('(corrected by you)');
-      }
-      return lines.join('\n');
-    },
-    async refresh() {
-      const r = await fetch('/api/state');
-      const data = await r.json();
-      this.applyState(data);
-    },
-    rev: 0,  // bumped on every state mutation; used as x-for :key suffix to force re-render
-    // Mutate state property-by-property and replace nested arrays with fresh references,
-    // so Alpine reactivity detects every change (replacing `state` wholesale can silently
-    // miss deep updates in x-for / :class bindings).
-    applyState(newState) {
-      if (!newState) return;
-      for (const k of Object.keys(newState)) {
-        const v = newState[k];
-        this.state[k] = Array.isArray(v) ? v.slice() : v;
-      }
-      this.rev++;
-    },
-    replaceSentence(sidx, sent) {
-      const arr = this.state.sentences.slice();
-      arr[sidx] = sent;
-      this.state.sentences = arr;
-      this.rev++;
-    },
-    // ----------- helpers -----------
-    primaryTag(tok) {
-      // pick the most informative field for the chip label
-      if (!this.state.schema) return '';
-      const enums = this.state.schema.fields.filter(f => f.type === 'enum' && f.name !== 'confidence');
-      if (enums.length > 0) {
-        const v = tok[enums[0].name];
-        if (v) return v;
-      }
-      // fallback to lemma if string-typed
-      if (tok.lemma) return tok.lemma;
-      return '';
-    },
-    tokenClass(sent, sidx, tidx, tok) {
-      const isFocus = this.focus.sent === sidx && this.focus.tok === tidx;
-      const isSelected = this.selection.has(`${sidx}:${tidx}`);
-      const hasDisagreement = (sent.disagreements || []).some(d => d.token_idx === tidx);
-      const hasContent = this.primaryTag(tok);
-      const corrected = !!tok._corrected;
-      let cls = 'token-base ';
-      if (hasDisagreement) cls += 'token-warn ';
-      else if (corrected) cls += 'token-corrected ';
-      else if (hasContent) cls += 'token-done ';
-      else cls += 'token-pending ';
-      if (isFocus) cls += 'token-focus ';
-      if (isSelected) cls += 'token-selected ';
-      return cls;
-    },
-    modelShort(m) {
-      const parts = m.split('/');
-      return parts[parts.length - 1];
-    },
-    // Per-model accuracy on a single sentence, ONLY shown after the user has
-    // confirmed the annotation as gold (sent.validated === true). Skips
-    // confidence/comment (same as disagreement counting).
-    modelAccuracy(sent) {
-      if (!sent || sent.status !== 'done' || !sent.validated) return [];
-      const perModel = sent.per_model || {};
-      const modelNames = Object.keys(perModel);
-      if (modelNames.length === 0) return [];
-      const quiet = new Set(['min', 'priority']);
-      const fields = (this.state.schema?.fields || []).filter(f => !quiet.has(f.aggregator));
-      const out = [];
-      for (const m of modelNames) {
-        const tokens = perModel[m].tokens || [];
-        let total = 0, correct = 0;
-        const n = Math.min(tokens.length, sent.tokens.length);
-        for (let i = 0; i < n; i++) {
-          const got = tokens[i] || {};
-          const ref = sent.tokens[i] || {};
-          for (const f of fields) {
-            if (f.type === 'object') {
-              for (const sub of (f.subfields || [])) {
-                const a = (got[f.name] || {})[sub.name] ?? null;
-                const b = (ref[f.name] || {})[sub.name] ?? null;
-                total++;
-                if (a === b) correct++;
-              }
-            } else {
-              const a = got[f.name] ?? null;
-              const b = ref[f.name] ?? null;
-              total++;
-              if (a === b) correct++;
             }
-          }
-        }
-        out.push({ model: m, pct: total > 0 ? Math.round(100 * correct / total) : 0, correct, total });
-      }
-      return out.sort((a, b) => b.pct - a.pct);
-    },
-    accuracyClass(pct) {
-      if (pct >= 90) return 'accuracy-pill-high';
-      if (pct >= 70) return 'accuracy-pill-mid';
-      return 'accuracy-pill-low';
-    },
-    modelTokenSummary(ann, tidx) {
-      const t = (ann.tokens || [])[tidx] || {};
-      const enums = (this.state.schema?.fields || []).filter(f => f.type === 'enum' && f.name !== 'confidence');
-      const lemma = t.lemma ? ` · lemma=${t.lemma}` : '';
-      const tag = enums[0] ? ` · ${enums[0].name}=${t[enums[0].name] ?? '∅'}` : '';
-      const conf = t.confidence ? ` · ${t.confidence}` : '';
-      return `${tag}${lemma}${conf}`;
-    },
-    currentPresetMatches(key) {
-      return this.state.schema?.task_name?.toLowerCase().includes(key.replace(/_/g, ' ').replace('tagset', '').trim());
-    },
-    // ----------- mutations: task / settings / models -----------
-    async setPreset(key) {
-      const r = await fetch('/api/task/preset', { method: 'POST', headers: { 'Content-Type': 'application/json' }, body: JSON.stringify({ key }) });
-      this.applyState(await r.json());
-      this.taskEditor.json = JSON.stringify(this.state.schema, null, 2);
-      this.toast('Task: ' + this.state.schema.task_name, 'ok');
-    },
-    async applyTaskJson() {
-      try {
-        const annotation_schema = JSON.parse(this.taskEditor.json);
-        const r = await fetch('/api/task/schema', { method: 'POST', headers: { 'Content-Type': 'application/json' }, body: JSON.stringify({ annotation_schema }) });
-        if (!r.ok) throw new Error((await r.json()).detail);
-        this.applyState(await r.json());
-        this.toast('Custom schema applied.', 'ok');
-      } catch (e) {
-        this.toast('Invalid schema JSON: ' + e.message, 'error');
-      }
-    },
-    async saveSettings(partial) {
-      const r = await fetch('/api/settings', { method: 'POST', headers: { 'Content-Type': 'application/json' }, body: JSON.stringify(partial) });
-      this.applyState(await r.json());
-    },
-    async setProvider(p) {
-      if (!this.state.providers.includes(p)) return;
-      await this.saveSettings({ provider: p });
-      this.toast(`Provider: ${p}. Models reset to its defaults.`, 'ok');
-    },
-    saveKey() {
-      const k = (this.keyEditor.value || '').trim();
-      if (!k) {
-        if (this.localKey) {
-          this.toast('No new key entered. Existing key kept.', 'warn');
-        } else {
-          this.toast('Paste a key first.', 'warn');
-        }
-        return;
-      }
-      this.setLocalKey(k);
-      this.keyEditor.value = '';
-      this.keyEditor.result = '';
-      this.keyEditor.ok = false;
-      this.toast(`✓ ${this.state.provider} key saved in this tab (${k.length} chars). Pill above should turn green.`, 'ok');
-      this.closeModal();
-    },
-    clearKey() {
-      this.setLocalKey('');
-      this.keyEditor.value = '';
-      this.keyEditor.result = '';
-      this.keyEditor.ok = false;
-      this.toast(`${this.state.provider} key cleared from this tab.`, 'ok');
-    },
-    async testKey(autoSaveOnSuccess = false) {
-      const k = (this.keyEditor.value || this.localKey || '').trim();
-      if (!k) { this.keyEditor.result = 'Paste a key first.'; this.keyEditor.ok = false; return; }
-      this.keyEditor.testing = true;
-      this.keyEditor.result = '';
-      try {
-        const r = await fetch('/api/settings/test_key', { method: 'POST', headers: { 'Content-Type': 'application/json' }, body: JSON.stringify({ api_key: k, provider: this.state.provider }) });
-        const j = await r.json();
-        this.keyEditor.ok = j.ok;
-        this.keyEditor.result = (j.ok ? '✓ ' : '✗ ') + j.message;
-        if (j.ok && autoSaveOnSuccess) {
-          this.setLocalKey(k);
-          this.keyEditor.value = '';
-          this.toast(`✓ ${this.state.provider} key tested & saved (${k.length} chars).`, 'ok');
-        }
-      } catch (e) {
-        this.keyEditor.ok = false;
-        this.keyEditor.result = '✗ ' + e.message;
-      }
-      this.keyEditor.testing = false;
-    },
-    async toggleModel(m) {
-      const set = new Set(this.state.models);
-      if (set.has(m)) set.delete(m); else set.add(m);
-      await this.saveSettings({ models: Array.from(set) });
-    },
-    async addCustomModel() {
-      const slug = (this.modelEditor.custom || '').trim();
-      if (!slug) return;
-      const set = new Set(this.state.models);
-      set.add(slug);
-      await this.saveSettings({ models: Array.from(set) });
-      this.modelEditor.custom = '';
-    },
-    async saveAdvanced() {
-      await this.saveSettings({
-        n_icl: this.advEditor.n_icl,
-        temperature: this.advEditor.temperature,
-        system_prompt: this.advEditor.system_prompt,
-        user_template: this.advEditor.user_template,
-      });
-      this.toast('Advanced settings saved.', 'ok');
-      this.closeModal();
-    },
-    // ----------- corpus loading -----------
-    async loadExercise(idx) {
-      this.loading = true;
-      try {
-        const r = await fetch('/api/corpus/exercise', { method: 'POST', headers: { 'Content-Type': 'application/json' }, body: JSON.stringify({ idx }) });
-        this.applyState(await r.json());
-        this.taskEditor.json = JSON.stringify(this.state.schema, null, 2);
-        this.toast(`Loaded: ${this.state.exercises[idx].title}`, 'ok');
-      } finally { this.loading = false; }
-    },
-    onTagKeydown(e) {
-      if (e.key === 'Enter' || e.key === ',' || e.key === ';') {
-        e.preventDefault();
-        this.addCustomTag();
-      }
-    },
-    addCustomTag() {
-      const raw = (this.pasteEditor.customTagInput || '').trim();
-      if (!raw) return;
-      const parts = raw.split(/[,;\n\t]+/).map(t => t.trim()).filter(Boolean);
-      for (const t of parts) {
-        if (!this.pasteEditor.customTags.includes(t)) {
-          this.pasteEditor.customTags.push(t);
-        }
-      }
-      this.pasteEditor.customTagInput = '';
-    },
-    buildCustomSchema() {
-      const fields = [];
-      const baseTags = this.pasteEditor.customTags.slice();
-      const values = this.pasteEditor.includeNone
-        ? (baseTags.includes('O') ? baseTags : ['O', ...baseTags])
-        : baseTags;
-      fields.push({
-        name: 'tag',
-        type: 'enum',
-        values,
-        nullable: false,
-        aggregator: 'vote',
-        subfields: [],
-      });
-      if (this.pasteEditor.includeConfidence) {
-        fields.push({ name: 'confidence', type: 'enum', values: ['low', 'medium', 'high'], nullable: false, aggregator: 'min', subfields: [] });
-      }
-      if (this.pasteEditor.includeComment) {
-        fields.push({ name: 'comment', type: 'string', values: [], nullable: true, aggregator: 'priority', subfields: [] });
-      }
-      return {
-        task_name: this.pasteEditor.customTaskName || 'Custom task',
-        language: this.pasteEditor.language || '',
-        description: '',
-        fields,
-      };
-    },
-    async loadPaste() {
-      // flush any pending tag still in the input
-      if ((this.pasteEditor.customTagInput || '').trim()) this.addCustomTag();
-      this.loading = true;
-      try {
-        // 1) Set the task BEFORE loading text (so the ICL pool & state are consistent)
-        if (this.pasteEditor.presetKey === 'custom') {
-          if (this.pasteEditor.customTags.length === 0) {
-            this.toast('Add at least one tag in the custom set.', 'warn');
-            return;
-          }
-          const annotation_schema = this.buildCustomSchema();
-          const r0 = await fetch('/api/task/schema', { method: 'POST', headers: { 'Content-Type': 'application/json' }, body: JSON.stringify({ annotation_schema }) });
-          if (!r0.ok) { this.toast('Schema rejected: ' + (await r0.json()).detail, 'error'); return; }
-          this.applyState(await r0.json());
-        } else if (this.pasteEditor.presetKey) {
-          const r0 = await fetch('/api/task/preset', { method: 'POST', headers: { 'Content-Type': 'application/json' }, body: JSON.stringify({ key: this.pasteEditor.presetKey }) });
-          if (r0.ok) this.applyState(await r0.json());
-        }
-        // 2) Load the text
-        const r = await fetch('/api/corpus/paste', { method: 'POST', headers: { 'Content-Type': 'application/json' }, body: JSON.stringify({
-          text: this.pasteEditor.text,
-          tokenizer: this.pasteEditor.tokenizer,
-          language: this.pasteEditor.language,
-        }) });
-        this.applyState(await r.json());
-        this.closeModal();
-        this.toast(`Loaded ${this.state.sentences.length} sentence(s). Task: ${this.state.schema?.task_name}.`, 'ok');
-      } finally { this.loading = false; }
-    },
-    async clearCorpus() {
-      const r = await fetch('/api/corpus/clear', { method: 'POST' });
-      this.applyState(await r.json());
-    },
-    async resetAll() {
-      if (!confirm('Reset everything? This wipes:\n• loaded corpus\n• annotations\n• ICL pool\n• custom task/schema\n• prompt overrides\n\nYour API key (browser-only) is kept.')) return;
-      this.loading = true;
-      try {
-        const r = await fetch('/api/reset', { method: 'POST' });
-        this.applyState(await r.json());
-        this.selection = new Set();
-        this.focus = { sent: null, tok: null };
-        this.modal = null;
-        this.toast('Workspace reset.', 'ok');
-      } finally { this.loading = false; }
-    },
-    async clearIcl() {
-      const r = await fetch('/api/icl/clear', { method: 'POST' });
-      this.applyState(await r.json());
-    },
-    // ----------- annotation -----------
-    async annotateAll() {
-      if (!this.canRun || this.loading) return;
-      this.loading = true;
-      this.progressText = `Annotating ${this.state.sentences.length} sentences…`;
-      // optimistic: mark all pending sentences as annotating
-      this.state.sentences.forEach(s => { if (s.status !== 'done') s.status = 'annotating'; });
-      try {
-        const r = await fetch('/api/annotate', { method: 'POST', headers: { 'Content-Type': 'application/json', ...this.keyHeaders() }, body: JSON.stringify({}) });
-        if (!r.ok) throw new Error((await r.json()).detail);
-        this.applyState(await r.json());
-        const dis = this.totalDisagreements;
-        this.toast(`Done. ${dis} disagreement${dis !== 1 ? 's' : ''} to review.`, dis > 0 ? 'warn' : 'ok');
-      } catch (e) {
-        this.toast(e.message, 'error');
-      } finally { this.loading = false; }
-    },
-    async annotateOne(sidx) {
-      if (!this.hasKey) { this.modal = 'key'; return; }
-      this.loading = true;
-      this.state.sentences[sidx].status = 'annotating';
-      try {
-        const r = await fetch('/api/annotate', { method: 'POST', headers: { 'Content-Type': 'application/json', ...this.keyHeaders() }, body: JSON.stringify({ sentence_idxs: [sidx] }) });
-        if (!r.ok) throw new Error((await r.json()).detail);
-        this.applyState(await r.json());
-        const s = this.state.sentences[sidx];
-        this.toast(`Sentence ${s.id}: ${s.n_disagreements} disagreement(s).`, s.n_disagreements > 0 ? 'warn' : 'ok');
-      } catch (e) { this.toast(e.message, 'error'); }
-      this.loading = false;
-    },
-    async addSentenceToIcl(sidx) {
-      const r = await fetch(`/api/sentence/${sidx}/add_to_icl`, { method: 'POST' });
-      this.applyState(await r.json());
-      this.toast(`Added to ICL pool (v${this.state.icl_pool.version}, ${this.state.icl_pool.size} entries).`, 'ok');
-    },
-    async setValidated(sidx, value) {
-      const r = await fetch(`/api/sentence/${sidx}/validate`, {
         method: 'POST',
-        headers: { 'Content-Type': 'application/json' },
-        body: JSON.stringify({ value }),
-      });
-      if (!r.ok) { this.toast('Could not toggle scoring.', 'error'); return; }
-      const sent = await r.json();
-      this.replaceSentence(sidx, sent);
-      this.toast(value ? '📊 Showing per-model accuracy vs your current annotation.' : 'Scores hidden.', 'ok');
-    },
-    // ----------- token editor -----------
-    onTokenClick(ev, sidx, tidx) {
-      if (ev.shiftKey) {
-        this.toggleSelectionIdx(sidx, tidx);
         return;
-      }
-      this.openTokenEditor(sidx, tidx);
-    },
-    openTokenEditor(sidx, tidx) {
-      const sent = this.state.sentences[sidx];
-      const tok = JSON.parse(JSON.stringify(sent.tokens[tidx] || {}));
-      this.editor.sidx = sidx;
-      this.editor.tidx = tidx;
-      this.editor.tok = tok;
-      this.editor.original = JSON.parse(JSON.stringify(tok));  // snapshot for diff
-      this.editor.search = {};
-      this.editor.filtered = {};
-      this.editor.perModel = sent.per_model || {};
-      this.editor.disagreementCells = (sent.disagreements || []).filter(d => d.token_idx === tidx);
-      this.editor.propagateToSimilar = false;
-      this.focus = { sent: sidx, tok: tidx };
-      this.modal = 'token';
-    },
-    matchingTokenCount() {
-      if (!this.editor.tok) return 0;
-      const surf = this.editor.tok.surface;
-      let n = 0;
-      for (let s = 0; s < this.state.sentences.length; s++) {
-        for (let t = 0; t < this.state.sentences[s].tokens.length; t++) {
-          if (s === this.editor.sidx && t === this.editor.tidx) continue;
-          if (this.state.sentences[s].tokens[t].surface === surf) n++;
-        }
-      }
-      return n;
-    },
-    fieldChanges() {
-      const out = {};
-      if (!this.editor.tok || !this.editor.original) return out;
-      for (const k of Object.keys(this.editor.tok)) {
-        if (k === 'surface' || k.startsWith('_')) continue;
-        const a = JSON.stringify(this.editor.tok[k] ?? null);
-        const b = JSON.stringify(this.editor.original[k] ?? null);
-        if (a !== b) out[k] = this.editor.tok[k];
-      }
-      return out;
-    },
-    fieldChangesSummary() {
-      const c = this.fieldChanges();
-      return Object.entries(c).map(([k, v]) => {
-        const val = (v === null || v === undefined) ? '∅' : (typeof v === 'object' ? JSON.stringify(v) : String(v));
-        return `${k}=${val}`;
-      }).join(', ');
-    },
-    refreshFilter(name, values) {
-      const q = (this.editor.search[name] || '').toLowerCase();
-      this.editor.filtered[name] = values.filter(v => v.toLowerCase().includes(q));
-    },
-    adoptFromModel(model) {
-      const sent = this.state.sentences[this.editor.sidx];
-      const t = (sent.per_model[model]?.tokens || [])[this.editor.tidx];
-      if (!t) return;
-      // copy all fields except surface
-      const surface = this.editor.tok.surface;
-      this.editor.tok = { ...t, surface };
-      this.toast(`Adopted from ${this.modelShort(model)}.`, 'ok');
-    },
-    async reaskOneToken(model) {
-      try {
-        const r = await fetch('/api/annotate/token', { method: 'POST', headers: { 'Content-Type': 'application/json', ...this.keyHeaders() }, body: JSON.stringify({
-          sent: this.editor.sidx, tok: this.editor.tidx, model,
-        }) });
-        if (!r.ok) throw new Error((await r.json()).detail);
-        const sent = await r.json();
-        this.replaceSentence(this.editor.sidx, sent);
-        // re-open with the new token
-        this.openTokenEditor(this.editor.sidx, this.editor.tidx);
-        this.toast(`Re-asked ${this.modelShort(model)}.`, 'ok');
-      } catch (e) { this.toast(e.message, 'error'); }
-    },
-    async reaskOneTokenAt(sidx, tidx, model) {
-      this.editor.sidx = sidx; this.editor.tidx = tidx;
-      await this.reaskOneToken(model);
-    },
-    async saveToken() {
-      const sidx = this.editor.sidx, tidx = this.editor.tidx;
-      const surface = this.editor.tok.surface;
-      const changes = this.fieldChanges();
-      const wantPropagate = this.editor.propagateToSimilar && Object.keys(changes).length > 0 && this.matchingTokenCount() > 0;
-      this.editor.tok._corrected = true;
-      const r = await fetch(`/api/sentence/${sidx}/token/${tidx}`, { method: 'POST', headers: { 'Content-Type': 'application/json' }, body: JSON.stringify({ token: this.editor.tok }) });
-      if (!r.ok) { this.toast('Save failed.', 'error'); return; }
-      const sent = await r.json();
-      this.replaceSentence(sidx, sent);
-      let propagatedCount = 0;
-      if (wantPropagate) {
         try {
-          const r2 = await fetch('/api/bulk_similar', {
-            method: 'POST',
-            headers: { 'Content-Type': 'application/json' },
-            body: JSON.stringify({
-              surface,
-              updates: changes,
-              exclude: [{ s: sidx, t: tidx }],
-            }),
-          });
-          if (r2.ok) {
-            const j = await r2.json();
-            this.applyState(j.state);
-            propagatedCount = (j.affected || []).length;
-          }
         } catch (e) {
-          this.toast('Propagation failed: ' + e.message, 'error');
         }
-      }
-      // auto-advance
-      if (this.editor.autoAdvance) {
         const next = this.findNextDisagreement(sidx, tidx);
         if (next) {
-          this.openTokenEditor(next.s, next.t);
-          if (propagatedCount > 0) this.toast(`✓ Saved + propagated to ${propagatedCount} other "${surface}".`, 'ok');
-          return;
-        }
-      }
-      this.closeModal();
-      this.toast(propagatedCount > 0 ? `✓ Saved + propagated to ${propagatedCount} other "${surface}".` : '✓ Saved.', 'ok');
-    },
-    findNextDisagreement(sidx, tidx) {
-      const sents = this.state.sentences;
-      // search rest of current sentence
-      const sent = sents[sidx];
-      const more = (sent.disagreements || []).filter(d => d.token_idx > tidx).sort((a, b) => a.token_idx - b.token_idx);
-      if (more.length > 0) return { s: sidx, t: more[0].token_idx };
-      // next sentences
-      for (let i = sidx + 1; i < sents.length; i++) {
-        const ds = sents[i].disagreements || [];
-        if (ds.length > 0) {
-          const t = ds.sort((a, b) => a.token_idx - b.token_idx)[0].token_idx;
-          return { s: i, t };
-        }
-      }
-      return null;
-    },
-    moveToken(delta) {
-      const sent = this.state.sentences[this.editor.sidx];
-      const next = this.editor.tidx + delta;
-      if (next < 0 || next >= sent.tokens.length) return;
-      this.openTokenEditor(this.editor.sidx, next);
-    },
-    // ----------- selection / bulk -----------
-    toggleSelectionIdx(sidx, tidx) {
-      const k = `${sidx}:${tidx}`;
-      if (this.selection.has(k)) this.selection.delete(k);
-      else this.selection.add(k);
-      // alpine reactivity: replace Set
-      this.selection = new Set(this.selection);
-    },
-    clearSelection() { this.selection = new Set(); },
-    bulkSelectedField() {
-      return this.schemaFields.find(f => f.name === this.bulkEditor.field);
-    },
-    async applyBulk() {
-      const bySent = {};
-      for (const k of this.selection) {
-        const [s, t] = k.split(':').map(Number);
-        if (!bySent[s]) bySent[s] = [];
-        bySent[s].push(t);
-      }
-      for (const [s, idxs] of Object.entries(bySent)) {
-        const r = await fetch(`/api/sentence/${s}/bulk`, { method: 'POST', headers: { 'Content-Type': 'application/json' }, body: JSON.stringify({
-          token_idxs: idxs, field: this.bulkEditor.field, value: this.bulkEditor.value,
-        }) });
-        if (r.ok) this.replaceSentence(Number(s), await r.json());
-      }
-      this.clearSelection();
-      this.closeModal();
-      this.toast('Bulk applied.', 'ok');
-    },
-    // ----------- context menu -----------
-    openTokenContext(ev, sidx, tidx) {
-      this.ctxMenu = { open: true, x: ev.clientX, y: ev.clientY, s: sidx, t: tidx };
-    },
-    // ----------- modals -----------
-    closeModal() {
-      this.modal = null;
-      this.editor.sidx = null; this.editor.tidx = null; this.editor.tok = null;
-    },
-    // ----------- keyboard -----------
-    globalKey(e) {
-      // editor-modal: route to editor keys
-      if (this.modal === 'token' && this.editor.tok) {
-        if (e.key === 'Escape') { this.closeModal(); e.preventDefault(); return; }
-        if (e.key === 'Enter' && !(e.target.tagName === 'INPUT' || e.target.tagName === 'TEXTAREA')) {
-          this.saveToken(); e.preventDefault(); return;
-        }
-        if (e.key === 'ArrowLeft') { this.moveToken(-1); e.preventDefault(); return; }
-        if (e.key === 'ArrowRight') { this.moveToken(1); e.preventDefault(); return; }
-        // 1-9 → assign primary enum
-        const num = parseInt(e.key);
-        if (!isNaN(num) && num >= 1 && num <= 9) {
-          const enums = this.schemaFields.filter(f => f.type === 'enum' && f.name !== 'confidence');
-          if (enums.length > 0) {
-            const f = enums[0];
-            const visible = this.editor.filtered[f.name] || f.values;
-            const v = visible[num - 1];
-            if (v) { this.editor.tok[f.name] = v; e.preventDefault(); }
-          }
         }
-        return;
-      }
-      if (this.modal) {
-        if (e.key === 'Escape') { this.closeModal(); e.preventDefault(); }
-        return;
-      }
-      if (e.target.tagName === 'INPUT' || e.target.tagName === 'TEXTAREA') return;
-      // global shortcuts
-      if (e.key === 'j') { this.moveFocus(1); e.preventDefault(); }
-      else if (e.key === 'k') { this.moveFocus(-1); e.preventDefault(); }
-      else if (e.key === 'e' || e.key === 'Enter') {
-        if (this.focus.sent !== null) { this.openTokenEditor(this.focus.sent, this.focus.tok); e.preventDefault(); }
-      }
-      else if (e.key === 'x') {
-        if (this.focus.sent !== null) { this.toggleSelectionIdx(this.focus.sent, this.focus.tok); e.preventDefault(); }
-      }
-      else if (e.key === 'r') {
-        if (this.focus.sent !== null) { this.annotateOne(this.focus.sent); e.preventDefault(); }
-      }
-      else if (e.key === 'Escape') { this.clearSelection(); }
-    },
-    handleKey(e) { /* main panel passthrough — globalKey handles all */ },
-    moveFocus(delta) {
-      const sents = this.state.sentences;
-      if (sents.length === 0) return;
-      if (this.focus.sent === null) {
-        this.focus = { sent: 0, tok: 0 };
-        return;
-      }
-      let s = this.focus.sent, t = this.focus.tok + delta;
-      while (s >= 0 && s < sents.length) {
-        if (t < 0) { s -= 1; if (s < 0) return; t = sents[s].tokens.length - 1; continue; }
-        if (t >= sents[s].tokens.length) { s += 1; t = 0; continue; }
-        this.focus = { sent: s, tok: t };
-        // scroll into view
-        this.$nextTick(() => {
-          const el = document.querySelector(`button.token-base[data-sent="${s}"][data-tok="${t}"]`);
-          if (el) el.scrollIntoView({ block: 'center', behavior: 'smooth' });
-        });
-        return;
-      }
-    },
-    // ----------- toasts -----------
-    toast(msg, kind = 'ok') {
-      const id = this.nextToastId++;
-      this.toasts.push({ id, msg, kind });
-      setTimeout(() => { this.toasts = this.toasts.filter(t => t.id !== id); }, 3500);
-    },
-    // ----------- markdown -> html (minimal) -----------
-    markdownToHtml(md) {
-      // very lightweight; safe enough for trusted local content
-      let h = md
-        .replace(/&/g, '&amp;').replace(/</g, '&lt;').replace(/>/g, '&gt;')
-        .replace(/^### (.*)$/gm, '<h3>$1</h3>')
-        .replace(/^## (.*)$/gm, '<h2>$1</h2>')
-        .replace(/^# (.*)$/gm, '<h1>$1</h1>')
-        .replace(/\*\*(.+?)\*\*/g, '<strong>$1</strong>')
-        .replace(/`([^`]+)`/g, '<code>$1</code>')
-        .replace(/^- (.*)$/gm, '<li>$1</li>')
-        .replace(/^\d+\. (.*)$/gm, '<li>$1</li>');
-      h = h.replace(/(<li>.*<\/li>\n?)+/g, m => '<ul>' + m + '</ul>');
-      h = h.split(/\n{2,}/).map(p => /^<[hul]/.test(p) ? p : '<p>' + p.replace(/\n/g, '<br>') + '</p>').join('\n');
-      return h;
-    },
-  };
 }

 // LREC 2026 — LLM Annotator front-end logic (Alpine.js)
 function annotator() {
+    return {
+        // ----------- state -----------
+        // Initial values of the component's data. `state` below is overwritten key by key
+        // by applyState() with the payload fetched from /api/state.
+        paperLink: 'https://aclanthology.org/2026.loreslm-1.28/',
+        loading: false,
+        progressText: 'Annotating…',
+        // Name of the open modal or null; runGuideAction() assigns values such as
+        // 'paste', 'key', 'models' and 'exports'.
+        modal: null,
+        // HTML produced by markdownToHtml() from the /api/cheatsheet response (see init()).
+        cheatsheetHtml: '',
+        toasts: [],
+        nextToastId: 1,
+        // Focused token as (sentence index, token index); compared in tokenClass().
+        focus: {sent: null, tok: null},
+        // Selected tokens, stored as `${sidx}:${tidx}` keys (see tokenClass()).
+        selection: new Set(),
+        ctxMenu: {open: false, x: 0, y: 0, s: null, t: null},
+        // Dismissal flags; init() restores them from localStorage.
+        guideDismissed: false,
+        moeBannerDismissed: false,
+        moeHintDismissed: false,
+        // Per-provider client-side keys; persisted in sessionStorage only
+        localKeys: {openrouter: '', mistral: '', openai: '', ilaas: ''},
+        state: {
+            schema: null,
+            schema_hash: '',
+            json_schema: {},
+            language: '',
+            system_prompt: '',
+            user_template: '',
+            // When true, `hasKey` is satisfied even without a client-side key.
+            has_env_key: false,
+            // Active provider; selects the entry of `localKeys` returned by `localKey`.
+            provider: 'openrouter',
+            providers: ['openrouter', 'mistral', 'openai', 'ilaas'],
+            curated_models_by_provider: {},
+            models: [],
+            priority: [],
+            temperature: 0,
+            n_icl: 5,
+            icl_pool: {version: 0, size: 0, entries: []},
+            sentences: [],
+            presets: [],
+            curated_models: [],
+            aggregators: [],
+            exercises: [],
+        },
+        // Working copy used by the token editor modal.
+        editor: {
+            sidx: null, tidx: null,
+            tok: null,
+            original: null,            // snapshot at modal-open, used to diff field changes
+            perModel: {},
+            disagreementCells: [],
+            search: {},
+            filtered: {},
+            autoAdvance: true,
+            propagateToSimilar: false,
+        },
+        // Editor mirrors; init() seeds several of them from `state` after the first refresh.
+        taskEditor: {json: ''},
+        modelEditor: {custom: '', priority: ''},
+        keyEditor: {value: '', testing: false, result: '', ok: false},
+        pasteEditor: {
+            text: '',
+            tokenizer: 'whitespace',
+            language: '',
+            presetKey: 'ud_upos_morph',
+            customTaskName: 'My custom task',
+            customTagInput: '',
+            customTags: [],
+            includeNone: true,
+            includeConfidence: true,
+            includeComment: false,
+        },
+        advEditor: {system_prompt: '', user_template: '', n_icl: 5, temperature: 0},
+        bulkEditor: {field: '', value: ''},
+        // ----------- derived -----------
+        get schema() {
+            return this.state.schema;
+        },
+        get schemaFields() {
+            const f = (this.state.schema && this.state.schema.fields) || [];
+            return f;
+        },
+        get totalTokens() {
+            return this.state.sentences.reduce((a, s) => a + s.tokens.length, 0);
+        },
+        get totalDisagreements() {
+            return this.state.sentences.reduce((a, s) => a + (s.n_disagreements || 0), 0);
+        },
+        // ----------- key helpers (per-provider) -----------
+        get localKey() {
+            return this.localKeys[this.state.provider] || '';
+        },
+        setLocalKey(value) {
+            const p = this.state.provider;
+            this.localKeys = {...this.localKeys, [p]: value};
+            try {
+                sessionStorage.setItem('llm_keys', JSON.stringify(this.localKeys));
+            } catch (e) {
             }
+        },
+        get hasKey() {
+            return !!this.localKey || !!this.state.has_env_key;
+        },
+        get canRun() {
+            return this.hasKey && this.state.models.length > 0 && this.state.sentences.length > 0;
+        },
+        keyHeaders() {
+            const h = {'X-LLM-Provider': this.state.provider};
+            if (this.localKey) h['X-API-Key'] = this.localKey;
+            return h;
+        },
+        // ----------- init -----------
+        async init() {
+            this.guideDismissed = localStorage.getItem('guideDismissed') === '1';
+            this.moeBannerDismissed = localStorage.getItem('moeBannerDismissed') === '1';
+            this.moeHintDismissed = localStorage.getItem('moeHintDismissed') === '1';
+            // Load per-provider keys; migrate legacy single-key key if present
+            try {
+                const raw = sessionStorage.getItem('llm_keys');
+                if (raw) {
+                    this.localKeys = {
+                        openrouter: '',
+                        mistral: '',
+                        openai: '',
+                        ilaas: '',
+                        ...JSON.parse(raw),
+                    };
+                }
+                const legacy = sessionStorage.getItem('openrouter_key');
+                if (legacy && !this.localKeys.openrouter) {
+                    this.localKeys = {...this.localKeys, openrouter: legacy};
+                    sessionStorage.setItem('llm_keys', JSON.stringify(this.localKeys));
+                    sessionStorage.removeItem('openrouter_key');
+                }
+            } catch (e) {
+            }
+            await this.refresh();
+            try {
+                const r = await fetch('/api/cheatsheet');
+                const txt = await r.text();
+                this.cheatsheetHtml = this.markdownToHtml(txt);
+            } catch (e) {
+            }
+            // sync editor mirrors
+            this.taskEditor.json = JSON.stringify(this.state.schema, null, 2);
+            this.modelEditor.priority = this.state.priority.join(', ');
+            this.advEditor.system_prompt = this.state.system_prompt;
+            this.advEditor.user_template = this.state.user_template;
+            this.advEditor.n_icl = this.state.n_icl;
+            this.advEditor.temperature = this.state.temperature;
+            window.addEventListener('keydown', (e) => this.globalKey(e));
+            // persist dismissals
+            this.$watch?.('moeBannerDismissed', v => localStorage.setItem('moeBannerDismissed', v ? '1' : '0'));
+            this.$watch?.('moeHintDismissed', v => localStorage.setItem('moeHintDismissed', v ? '1' : '0'));
+        },
+        // ----------- contextual guide -----------
+        get guide() {
+            const s = this.state;
+            if (s.sentences.length === 0) {
+                return {
+                    step: 1, icon: '📜', title: 'Load a corpus to start',
+                    body: 'Pick a sandbox example in the left sidebar — Greek, Armenian or Syriac. They come with a task preset, a validated tagset, and 3–5 pre-loaded ICL examples (visible in the toolbar: <strong>ICL pool · v3 · 5 ex</strong>).',
+                    actions: [
+                        {label: '📘 Try Armenian (HYE)', handler: 'loadExercise', arg: 1},
+                        {label: 'Paste my own text', handler: 'modal', arg: 'paste'},
+                    ],
+                };
+            }
+            if (!this.hasKey) {
+                const providerLabel = s.provider || 'provider';
+                const body = s.provider === 'openrouter'
+                    ? 'One OpenRouter key gives you access to Claude, GPT, Mistral, Llama, Qwen, DeepSeek and more. The key is kept <strong>in this browser tab only</strong>...'
+                    : `Add your <strong>${providerLabel}</strong> API key. The key is kept <strong>in this browser tab only</strong> and sent as an <code>X-API-Key</code> header.`;
+                return {
+                    step: 2,
+                    icon: '🔑',
+                    title: `Add your ${providerLabel} API key`,
+                    body,
+                    actions: [
+                        {label: 'Add API key', handler: 'modal', arg: 'key'},
+                    ],
+                };
+            }
+            const anyDone = s.sentences.some(x => x.status === 'done');
+            const anyPending = s.sentences.some(x => x.status === 'pending');
+            const totalDis = this.totalDisagreements;
+            const lastWasMoE = s.sentences.some(x => Object.keys(x.per_model || {}).length >= 2);
+            if (!anyDone) {
+                const moeNote = s.models.length >= 2
+                    ? `<strong>MoE is ON</strong> — your ${s.models.length} models will be called in parallel and their answers voted token-by-token.`
+                    : `Single model mode. To enable <strong>Mixture-of-Experts</strong> (parallel models + per-token vote), add a 2nd model.`;
+                return {
+                    step: 3, icon: '▶️', title: 'Run the first annotation',
+                    body: `Click <strong>Annotate all</strong> in the toolbar. The ${s.icl_pool.size} ICL examples already in the pool will be sent as few-shot context. ${moeNote}`,
+                    actions: [
+                        {label: '▶ Annotate all', handler: 'annotateAll'},
+                        {label: 'Add a 2nd model (MoE)', handler: 'modal', arg: 'models', show: s.models.length < 2},
+                    ].filter(a => a.show !== false),
+                };
+            }
+            if (totalDis > 0) {
+                const moeMsg = lastWasMoE
+                    ? `Each ⚠ amber token has at least one field where your models disagreed. Click it to see <em>which model said what</em> and pick the right answer (or click <kbd>adopt</kbd> next to one model).`
+                    : `Click a token to edit it: change its tag, lemma, or any field. With keyboard: <kbd>e</kbd> to edit, <kbd>↵</kbd> to save & auto-advance to the next ⚠.`;
+                return {
+                    step: 4, icon: '⚠', title: `Review ${totalDis} disagreement${totalDis !== 1 ? 's' : ''}`,
+                    body: moeMsg,
+                    actions: [
+                        {label: 'Open first ⚠', handler: 'jumpToFirstDisagreement'},
+                    ],
+                };
+            }
+            if (s.icl_pool.entries.filter(e => e.source === 'corrected').length === 0 && anyDone) {
+                return {
+                    step: 5, icon: '📥', title: 'Feed corrections back to ICL',
+                    body: 'Your sentences look consensual. To bootstrap: click <strong>📥 to ICL</strong> on any sentence to add its (corrected) annotation to the few-shot pool. Subsequent runs will reuse it. <strong>This is how the loop closes.</strong> Then export, or load more sentences.',
+                    actions: [
+                        {label: '⬇ Export the corpus', handler: 'modal', arg: 'exports'},
+                    ],
+                };
+            }
+            return {
+                step: 5, icon: '✅', title: 'Loop closed — export or continue',
+                body: `Your ICL pool now has <strong>${s.icl_pool.size}</strong> entries (version <strong>v${s.icl_pool.version}</strong>). Re-run on more sentences and they will benefit from your corrections. Or export the corpus in TSV / JSON / CoNLL-U / JSONL.`,
+                actions: [
+                    {label: '⬇ Export', handler: 'modal', arg: 'exports'},
+                    {label: 'Paste more text', handler: 'modal', arg: 'paste'},
+                ],
+            };
+        },
+        runGuideAction(a) {
+            if (a.handler === 'modal') {
+                this.modal = a.arg;
+                return;
+            }
+            if (a.handler === 'loadExercise') {
+                this.loadExercise(a.arg);
+                return;
+            }
+            if (a.handler === 'annotateAll') {
+                this.annotateAll();
+                return;
+            }
+            if (a.handler === 'openExternal') {
+                window.open(a.arg, '_blank');
+                return;
+            }
+            if (a.handler === 'jumpToFirstDisagreement') {
+                for (let i = 0; i < this.state.sentences.length; i++) {
+                    const ds = this.state.sentences[i].disagreements || [];
+                    if (ds.length > 0) {
+                        const t = ds.sort((x, y) => x.token_idx - y.token_idx)[0].token_idx;
+                        this.openTokenEditor(i, t);
+                        return;
+                    }
+                }
+            }
+        },
+        allDisplayableModels() {
+            const set = new Set(this.state.curated_models);
+            for (const m of this.state.models) set.add(m);
+            return Array.from(set);
+        },
+        tokenTooltip(sent, tidx) {
+            const tok = sent.tokens[tidx];
+            const lines = [`${tok.surface}`];
+            for (const f of (this.state.schema?.fields || [])) {
+                const v = tok[f.name];
+                if (v && typeof v !== 'object') lines.push(`${f.name}: ${v}`);
+            }
+            const dis = (sent.disagreements || []).filter(d => d.token_idx === tidx);
+            if (dis.length > 0 && Object.keys(sent.per_model || {}).length > 0) {
+                lines.push('');
+                lines.push('Per-model votes:');
+                for (const [m, ann] of Object.entries(sent.per_model)) {
+                    const t = (ann.tokens || [])[tidx] || {};
+                    const enums = (this.state.schema?.fields || []).filter(f => f.type === 'enum' && f.name !== 'confidence');
+                    const tag = enums[0] ? (t[enums[0].name] ?? '∅') : '';
+                    const lemma = t.lemma ? ` ${t.lemma}` : '';
+                    lines.push(`  • ${this.modelShort(m)}: ${tag}${lemma}`);
+                }
+            } else if (tok._corrected) {
+                lines.push('(corrected by you)');
+            }
+            return lines.join('\n');
+        },
+        async refresh() {
+            const r = await fetch('/api/state');
+            const data = await r.json();
+            this.applyState(data);
+        },
+        rev: 0,  // bumped on every state mutation; used as x-for :key suffix to force re-render
+        // Mutate state property-by-property and replace nested arrays with fresh references,
+        // so Alpine reactivity detects every change (replacing `state` wholesale can silently
+        // miss deep updates in x-for / :class bindings).
+        applyState(newState) {
+            if (!newState) return;
+            for (const k of Object.keys(newState)) {
+                const v = newState[k];
+                if (k === 'sentences') {
+                    this.state.sentences = (v || []).map(s => ({
+                        ...s,
+                        tokens: (s.tokens || []).map(t => ({...t})),
+                        disagreements: [...(s.disagreements || [])],
+                        per_model: {...(s.per_model || {})},
+                    }));
+                } else if (Array.isArray(v)) {
+                    this.state[k] = [...v];
+                } else if (v && typeof v === 'object') {
+                    this.state[k] = {...v};
+                } else {
+                    this.state[k] = v;
+                }
+            }
+            for (const sent of this.state.sentences || []) {
+                if (sent.validated) {
+                    sent._accuracy = this.modelAccuracy(sent);
+                }
+            }
+            this.rev++;
+        },
+        replaceSentence(sidx, sent) {
+            const arr = [...this.state.sentences];
+            arr[sidx] = {
+                ...sent,
+                tokens: (sent.tokens || []).map(t => ({...t})),
+                disagreements: [...(sent.disagreements || [])],
+                per_model: {...(sent.per_model || {})},
+            };
+            this.state.sentences = arr;
+            this.rev++;
+        },
+        // ----------- helpers -----------
+        primaryTag(tok) {
+            // pick the most informative field for the chip label
+            if (!this.state.schema) return '';
+            const enums = this.state.schema.fields.filter(f => f.type === 'enum' && f.name !== 'confidence');
+            if (enums.length > 0) {
+                const v = tok[enums[0].name];
+                if (v) return v;
+            }
+            // fallback to lemma if string-typed
+            if (tok.lemma) return tok.lemma;
+            return '';
+        },
+        tokenClass(sent, sidx, tidx, tok) {
+            const isFocus = this.focus.sent === sidx && this.focus.tok === tidx;
+            const isSelected = this.selection.has(`${sidx}:${tidx}`);
+            const hasDisagreement = (sent.disagreements || []).some(d => d.token_idx === tidx);
+            const hasContent = this.primaryTag(tok);
+            const corrected = !!tok._corrected;
+            let cls = 'token-base ';
+            if (hasDisagreement) cls += 'token-warn ';
+            else if (corrected) cls += 'token-corrected ';
+            else if (hasContent) cls += 'token-done ';
+            else cls += 'token-pending ';
+            if (isFocus) cls += 'token-focus ';
+            if (isSelected) cls += 'token-selected ';
+            return cls;
+        },
+        modelShort(m) {
+            const parts = m.split('/');
+            return parts[parts.length - 1];
+        },
+        // Per-model accuracy on a single sentence, ONLY shown after the user has
+        // confirmed the annotation as gold (sent.validated === true). Skips
+        // confidence/comment (same as disagreement counting).
+        modelAccuracy(sent) {
+            if (!sent || sent.status !== 'done' || !sent.validated) return [];
+            const perModel = sent.per_model || {};
+            const modelNames = Object.keys(perModel);
+            if (modelNames.length === 0) return [];
+            const quiet = new Set(['min', 'priority']);
+            const fields = (this.state.schema?.fields || []).filter(f => !quiet.has(f.aggregator));
+            const out = [];
+            for (const m of modelNames) {
+                const tokens = perModel[m].tokens || [];
+                let total = 0, correct = 0;
+                const n = Math.min(tokens.length, sent.tokens.length);
+                for (let i = 0; i < n; i++) {
+                    const got = tokens[i] || {};
+                    const ref = sent.tokens[i] || {};
+                    for (const f of fields) {
+                        if (f.type === 'object') {
+                            for (const sub of (f.subfields || [])) {
+                                const a = (got[f.name] || {})[sub.name] ?? null;
+                                const b = (ref[f.name] || {})[sub.name] ?? null;
+                                total++;
+                                if (a === b) correct++;
+                            }
+                        } else {
+                            const a = got[f.name] ?? null;
+                            const b = ref[f.name] ?? null;
+                            total++;
+                            if (a === b) correct++;
+                        }
+                    }
+                }
+                out.push({model: m, pct: total > 0 ? Math.round(100 * correct / total) : 0, correct, total});
+            }
+            return out.sort((a, b) => b.pct - a.pct);
+        },
+        accuracyClass(pct) {
+            if (pct >= 90) return 'accuracy-pill-high';
+            if (pct >= 70) return 'accuracy-pill-mid';
+            return 'accuracy-pill-low';
+        },
+        modelTokenSummary(ann, tidx) {
+            const t = (ann.tokens || [])[tidx] || {};
+            const enums = (this.state.schema?.fields || []).filter(f => f.type === 'enum' && f.name !== 'confidence');
+            const lemma = t.lemma ? ` · lemma=${t.lemma}` : '';
+            const tag = enums[0] ? ` · ${enums[0].name}=${t[enums[0].name] ?? '∅'}` : '';
+            const conf = t.confidence ? ` · ${t.confidence}` : '';
+            return `${tag}${lemma}${conf}`;
+        },
+        currentPresetMatches(key) {
+            return this.state.schema?.task_name?.toLowerCase().includes(key.replace(/_/g, ' ').replace('tagset', '').trim());
+        },
+        // ----------- mutations: task / settings / models -----------
+        async setPreset(key) {
+            const r = await fetch('/api/task/preset', {
+                method: 'POST',
+                headers: {'Content-Type': 'application/json'},
+                body: JSON.stringify({key})
+            });
+            this.applyState(await r.json());
+            this.taskEditor.json = JSON.stringify(this.state.schema, null, 2);
+            this.toast('Task: ' + this.state.schema.task_name, 'ok');
+        },
+        async applyTaskJson() {
+            try {
+                const annotation_schema = JSON.parse(this.taskEditor.json);
+                const r = await fetch('/api/task/schema', {
+                    method: 'POST',
+                    headers: {'Content-Type': 'application/json'},
+                    body: JSON.stringify({annotation_schema})
+                });
+                if (!r.ok) throw new Error((await r.json()).detail);
+                this.applyState(await r.json());
+                this.toast('Custom schema applied.', 'ok');
+            } catch (e) {
+                this.toast('Invalid schema JSON: ' + e.message, 'error');
+            }
+        },
+        async saveSettings(partial) {
+            const r = await fetch('/api/settings', {
+                method: 'POST',
+                headers: {'Content-Type': 'application/json'},
+                body: JSON.stringify(partial)
+            });
+            this.applyState(await r.json());
+        },
+        async setProvider(p) {
+            if (!this.state.providers.includes(p)) return;
+            await this.saveSettings({provider: p});
+            this.toast(`Provider: ${p}. Models reset to its defaults.`, 'ok');
+        },
+        saveKey() {
+            const k = (this.keyEditor.value || '').trim();
+            if (!k) {
+                if (this.localKey) {
+                    this.toast('No new key entered. Existing key kept.', 'warn');
+                } else {
+                    this.toast('Paste a key first.', 'warn');
+                }
+                return;
+            }
+            this.setLocalKey(k);
+            this.keyEditor.value = '';
+            this.keyEditor.result = '';
+            this.keyEditor.ok = false;
+            this.toast(`✓ ${this.state.provider} key saved in this tab (${k.length} chars). Pill above should turn green.`, 'ok');
+            this.closeModal();
+        },
+        clearKey() {
+            this.setLocalKey('');
+            this.keyEditor.value = '';
+            this.keyEditor.result = '';
+            this.keyEditor.ok = false;
+            this.toast(`${this.state.provider} key cleared from this tab.`, 'ok');
+        },
+        async testKey(autoSaveOnSuccess = false) {
+            const k = (this.keyEditor.value || this.localKey || '').trim();
+            if (!k) {
+                this.keyEditor.result = 'Paste a key first.';
+                this.keyEditor.ok = false;
+                return;
+            }
+            this.keyEditor.testing = true;
+            this.keyEditor.result = '';
+            try {
+                const r = await fetch('/api/settings/test_key', {
+                    method: 'POST',
+                    headers: {'Content-Type': 'application/json'},
+                    body: JSON.stringify({api_key: k, provider: this.state.provider})
+                });
+                const j = await r.json();
+                this.keyEditor.ok = j.ok;
+                this.keyEditor.result = (j.ok ? '✓ ' : '✗ ') + j.message;
+                if (j.ok && autoSaveOnSuccess) {
+                    this.setLocalKey(k);
+                    this.keyEditor.value = '';
+                    this.toast(`✓ ${this.state.provider} key tested & saved (${k.length} chars).`, 'ok');
+                }
+            } catch (e) {
+                this.keyEditor.ok = false;
+                this.keyEditor.result = '✗ ' + e.message;
+            }
+            this.keyEditor.testing = false;
+        },
+        async toggleModel(m) {
+            const set = new Set(this.state.models);
+            if (set.has(m)) set.delete(m); else set.add(m);
+            await this.saveSettings({models: Array.from(set)});
+        },
+        async addCustomModel() {
+            const slug = (this.modelEditor.custom || '').trim();
+            if (!slug) return;
+            const set = new Set(this.state.models);
+            set.add(slug);
+            await this.saveSettings({models: Array.from(set)});
+            this.modelEditor.custom = '';
+        },
+        async saveAdvanced() {
+            await this.saveSettings({
+                n_icl: this.advEditor.n_icl,
+                temperature: this.advEditor.temperature,
+                system_prompt: this.advEditor.system_prompt,
+                user_template: this.advEditor.user_template,
+            });
+            this.toast('Advanced settings saved.', 'ok');
+            this.closeModal();
+        },
+        // ----------- corpus loading -----------
+        async loadExercise(idx) {
+            this.loading = true;
+            try {
+                const r = await fetch('/api/corpus/exercise', {
+                    method: 'POST',
+                    headers: {'Content-Type': 'application/json'},
+                    body: JSON.stringify({idx})
+                });
+                this.applyState(await r.json());
+                this.taskEditor.json = JSON.stringify(this.state.schema, null, 2);
+                this.toast(`Loaded: ${this.state.exercises[idx].title}`, 'ok');
+            } finally {
+                this.loading = false;
+            }
+        },
+        onTagKeydown(e) {
+            if (e.key === 'Enter' || e.key === ',' || e.key === ';') {
+                e.preventDefault();
+                this.addCustomTag();
+            }
+        },
+        addCustomTag() {
+            const raw = (this.pasteEditor.customTagInput || '').trim();
+            if (!raw) return;
+            const parts = raw.split(/[,;\n\t]+/).map(t => t.trim()).filter(Boolean);
+            for (const t of parts) {
+                if (!this.pasteEditor.customTags.includes(t)) {
+                    this.pasteEditor.customTags.push(t);
+                }
+            }
+            this.pasteEditor.customTagInput = '';
+        },
+        buildCustomSchema() {
+            const fields = [];
+            const baseTags = this.pasteEditor.customTags.slice();
+            const values = this.pasteEditor.includeNone
+                ? (baseTags.includes('O') ? baseTags : ['O', ...baseTags])
+                : baseTags;
+            fields.push({
+                name: 'tag',
+                type: 'enum',
+                values,
+                nullable: false,
+                aggregator: 'vote',
+                subfields: [],
+            });
+            if (this.pasteEditor.includeConfidence) {
+                fields.push({
+                    name: 'confidence',
+                    type: 'enum',
+                    values: ['low', 'medium', 'high'],
+                    nullable: false,
+                    aggregator: 'min',
+                    subfields: []
+                });
+            }
+            if (this.pasteEditor.includeComment) {
+                fields.push({
+                    name: 'comment',
+                    type: 'string',
+                    values: [],
+                    nullable: true,
+                    aggregator: 'priority',
+                    subfields: []
+                });
+            }
+            return {
+                task_name: this.pasteEditor.customTaskName || 'Custom task',
+                language: this.pasteEditor.language || '',
+                description: '',
+                fields,
+            };
+        },
+        async loadPaste() {
+            // flush any pending tag still in the input
+            if ((this.pasteEditor.customTagInput || '').trim()) this.addCustomTag();
+            this.loading = true;
+            try {
+                // 1) Set the task BEFORE loading text (so the ICL pool & state are consistent)
+                if (this.pasteEditor.presetKey === 'custom') {
+                    if (this.pasteEditor.customTags.length === 0) {
+                        this.toast('Add at least one tag in the custom set.', 'warn');
+                        return;
+                    }
+                    const annotation_schema = this.buildCustomSchema();
+                    const r0 = await fetch('/api/task/schema', {
+                        method: 'POST',
+                        headers: {'Content-Type': 'application/json'},
+                        body: JSON.stringify({annotation_schema})
+                    });
+                    if (!r0.ok) {
+                        this.toast('Schema rejected: ' + (await r0.json()).detail, 'error');
+                        return;
+                    }
+                    this.applyState(await r0.json());
+                } else if (this.pasteEditor.presetKey) {
+                    const r0 = await fetch('/api/task/preset', {
+                        method: 'POST',
+                        headers: {'Content-Type': 'application/json'},
+                        body: JSON.stringify({key: this.pasteEditor.presetKey})
+                    });
+                    if (r0.ok) this.applyState(await r0.json());
+                }
+                // 2) Load the text
+                const r = await fetch('/api/corpus/paste', {
+                    method: 'POST', headers: {'Content-Type': 'application/json'}, body: JSON.stringify({
+                        text: this.pasteEditor.text,
+                        tokenizer: this.pasteEditor.tokenizer,
+                        language: this.pasteEditor.language,
+                    })
+                });
+                this.applyState(await r.json());
+                this.closeModal();
+                this.toast(`Loaded ${this.state.sentences.length} sentence(s). Task: ${this.state.schema?.task_name}.`, 'ok');
+            } finally {
+                this.loading = false;
+            }
+        },
+        async clearCorpus() {
+            const r = await fetch('/api/corpus/clear', {method: 'POST'});
+            this.applyState(await r.json());
+        },
+        async resetAll() {
+            if (!confirm('Reset everything? This wipes:\n• loaded corpus\n• annotations\n• ICL pool\n• custom task/schema\n• prompt overrides\n\nYour API key (browser-only) is kept.')) return;
+            this.loading = true;
+            try {
+                const r = await fetch('/api/reset', {method: 'POST'});
+                this.applyState(await r.json());
+                this.selection = new Set();
+                this.focus = {sent: null, tok: null};
+                this.modal = null;
+                this.toast('Workspace reset.', 'ok');
+            } finally {
+                this.loading = false;
+            }
+        },
+        async clearIcl() {
+            const r = await fetch('/api/icl/clear', {method: 'POST'});
+            this.applyState(await r.json());
+        },
+        // ----------- annotation -----------
+        async annotateAll() {
+            if (!this.canRun || this.loading) return;
+            this.loading = true;
+            this.progressText = `Annotating ${this.state.sentences.length} sentences…`;
+            // Optimistic UI: nouvelle référence pour Alpine
+            this.state.sentences = this.state.sentences.map(s =>
+                s.status !== 'done' ? {...s, status: 'annotating'} : s
+            );
+            try {
+                const r = await fetch('/api/annotate', {
+                    method: 'POST',
+                    headers: {'Content-Type': 'application/json', ...this.keyHeaders()},
+                    body: JSON.stringify({})
+                });
+                if (!r.ok) throw new Error((await r.json()).detail);
+                const data = await r.json();
+                this.applyState(data);
+                const dis = this.totalDisagreements;
+                this.toast(
+                    `Done. ${dis} disagreement${dis !== 1 ? 's' : ''} to review.`,
+                    dis > 0 ? 'warn' : 'ok'
+                );
+            } catch (e) {
+                this.toast(e.message, 'error');
+            } finally {
+                this.loading = false;
+            }
+        },
+        async annotateOne(sidx) {
+            if (!this.hasKey) {
+                this.modal = 'key';
+                return;
+            }
+            this.loading = true;
+            this.state.sentences = this.state.sentences.map((s, i) =>
+                i === sidx ? {...s, status: 'annotating'} : s
+            );
+            try {
+                const r = await fetch('/api/annotate', {
+                    method: 'POST',
+                    headers: {'Content-Type': 'application/json', ...this.keyHeaders()},
+                    body: JSON.stringify({sentence_idxs: [sidx]})
+                });
+                if (!r.ok) throw new Error((await r.json()).detail);
+                this.applyState(await r.json());
+                const s = this.state.sentences[sidx];
+                this.toast(`Sentence ${s.id}: ${s.n_disagreements} disagreement(s).`, s.n_disagreements > 0 ? 'warn' : 'ok');
+            } catch (e) {
+                this.toast(e.message, 'error');
+            }
+            this.loading = false;
+        },
+        async addSentenceToIcl(sidx) {
+            const r = await fetch(`/api/sentence/${sidx}/add_to_icl`, {method: 'POST'});
+            if (!r.ok) {
+                this.toast('Could not add to ICL pool.', 'error');
+                return;
+            }
+            const data = await r.json();
+            this.applyState(data);
+            if (data.icl_add_result === 'unchanged') {
+                this.toast(
+                    `Already in ICL pool — unchanged (v${this.state.icl_pool.version}, ${this.state.icl_pool.size} entries).`,
+                    'warn'
+                );
+            } else if (data.icl_add_result === 'updated') {
+                this.toast(
+                    `Updated existing ICL example after correction (v${this.state.icl_pool.version}, ${this.state.icl_pool.size} entries).`,
+                    'ok'
+                );
+            } else {
+                this.toast(
+                    `Added to ICL pool (v${this.state.icl_pool.version}, ${this.state.icl_pool.size} entries).`,
+                    'ok'
+                );
+            }
+        },
+        async setValidated(sidx, value) {
+            const r = await fetch(`/api/sentence/${sidx}/sent_score`, {
+                method: 'POST',
+                headers: {'Content-Type': 'application/json'},
+                body: JSON.stringify({value}),
+            });
+            if (!r.ok) {
+                this.toast('Could not toggle scoring.', 'error');
+                return;
+            }
+            const sent = await r.json();
+            sent._accuracy = this.modelAccuracy(sent);
+            this.replaceSentence(sidx, sent);
+            this.toast(value ? '📊 Showing per-model accuracy vs your current annotation.' : 'Scores hidden.', 'ok');
+        },
+        // ----------- token editor -----------
+        onTokenClick(ev, sidx, tidx) {
+            if (ev.shiftKey) {
+                this.toggleSelectionIdx(sidx, tidx);
+                return;
+            }
+            this.openTokenEditor(sidx, tidx);
+        },
+        openTokenEditor(sidx, tidx) {
+            const sent = this.state.sentences[sidx];
+            const tok = JSON.parse(JSON.stringify(sent.tokens[tidx] || {}));
+            this.editor.sidx = sidx;
+            this.editor.tidx = tidx;
+            this.editor.tok = tok;
+            this.editor.original = JSON.parse(JSON.stringify(tok));  // snapshot for diff
+            this.editor.search = {};
+            this.editor.filtered = {};
+            this.editor.perModel = sent.per_model || {};
+            this.editor.disagreementCells = (sent.disagreements || []).filter(d => d.token_idx === tidx);
+            this.editor.propagateToSimilar = false;
+            this.focus = {sent: sidx, tok: tidx};
+            this.modal = 'token';
+        },
+        matchingTokenCount() {
+            if (!this.editor.tok) return 0;
+            const surf = this.editor.tok.surface;
+            let n = 0;
+            for (let s = 0; s < this.state.sentences.length; s++) {
+                for (let t = 0; t < this.state.sentences[s].tokens.length; t++) {
+                    if (s === this.editor.sidx && t === this.editor.tidx) continue;
+                    if (this.state.sentences[s].tokens[t].surface === surf) n++;
+                }
+            }
+            return n;
+        },
+        fieldChanges() {
+            const out = {};
+            if (!this.editor.tok || !this.editor.original) return out;
+            for (const k of Object.keys(this.editor.tok)) {
+                if (k === 'surface' || k.startsWith('_')) continue;
+                const a = JSON.stringify(this.editor.tok[k] ?? null);
+                const b = JSON.stringify(this.editor.original[k] ?? null);
+                if (a !== b) out[k] = this.editor.tok[k];
+            }
+            return out;
+        },
+        fieldChangesSummary() {
+            const c = this.fieldChanges();
+            return Object.entries(c).map(([k, v]) => {
+                const val = (v === null || v === undefined) ? '∅' : (typeof v === 'object' ? JSON.stringify(v) : String(v));
+                return `${k}=${val}`;
+            }).join(', ');
+        },
+        refreshFilter(name, values) {
+            const q = (this.editor.search[name] || '').toLowerCase();
+            this.editor.filtered[name] = values.filter(v => v.toLowerCase().includes(q));
+        },
+        adoptFromModel(model) {
+            const sent = this.state.sentences[this.editor.sidx];
+            const t = (sent.per_model[model]?.tokens || [])[this.editor.tidx];
+            if (!t) return;
+            // copy all fields except surface
+            const surface = this.editor.tok.surface;
+            this.editor.tok = {...t, surface};
+            this.toast(`Adopted from ${this.modelShort(model)}.`, 'ok');
+        },
+        async reaskOneToken(model) {
+            try {
+                const r = await fetch('/api/annotate/token', {
+                    method: 'POST',
+                    headers: {'Content-Type': 'application/json', ...this.keyHeaders()},
+                    body: JSON.stringify({
+                        sent: this.editor.sidx, tok: this.editor.tidx, model,
+                    })
+                });
+                if (!r.ok) throw new Error((await r.json()).detail);
+                const sent = await r.json();
+                this.replaceSentence(this.editor.sidx, sent);
+                // re-open with the new token
+                this.openTokenEditor(this.editor.sidx, this.editor.tidx);
+                this.toast(`Re-asked ${this.modelShort(model)}.`, 'ok');
+            } catch (e) {
+                this.toast(e.message, 'error');
+            }
+        },
+        async reaskOneTokenAt(sidx, tidx, model) {
+            this.editor.sidx = sidx;
+            this.editor.tidx = tidx;
+            await this.reaskOneToken(model);
+        },
+        // Save the token in the editor, optionally propagate the edited fields
+        // to other tokens with the same surface form, then either advance to
+        // the next disagreement or close the modal, with a summary toast.
+        async saveToken() {
+    // Capture position, surface and the edited fields before any request:
+    // applyState and openTokenEditor below overwrite the editor/state.
+    const sidx = this.editor.sidx;
+    const tidx = this.editor.tidx;
+    const surface = this.editor.tok.surface;
+    const changes = this.fieldChanges();
+    // Propagate only when requested, something changed, and another token
+    // shares the surface form.
+    const wantPropagate =
+        this.editor.propagateToSimilar &&
+        Object.keys(changes).length > 0 &&
+        this.matchingTokenCount() > 0;
+    // Mark as user-corrected; tokenClass reads this flag for styling.
+    this.editor.tok._corrected = true;
+    const r = await fetch(`/api/sentence/${sidx}/token/${tidx}`, {
         method: 'POST',
+        headers: {'Content-Type': 'application/json'},
+        body: JSON.stringify({token: this.editor.tok})
+    });
+    if (!r.ok) {
+        this.toast('Save failed.', 'error');
         return;
+    }
+    // returns full state to ensure consistency
+    const data = await r.json();
+    this.applyState(data);
+    let propagatedCount = 0;
+    if (wantPropagate) {
         try {
+            const r2 = await fetch('/api/bulk_similar', {
+                method: 'POST',
+                headers: {'Content-Type': 'application/json'},
+                body: JSON.stringify({
+                    surface,
+                    updates: changes,
+                    exclude: [{s: sidx, t: tidx}],
+                }),
+            });
+            // NOTE(review): a non-ok response is skipped silently here; only
+            // thrown errors reach the toast in the catch below.
+            if (r2.ok) {
+                const j = await r2.json();
+                for (const item of (j.sentences || [])) {
+                    this.replaceSentence(item.idx, item.sentence);
+                }
+                propagatedCount = (j.affected || []).length;
+            }
         } catch (e) {
+            this.toast('Propagation failed: ' + e.message, 'error');
         }
+    }
+    // Suffix describing what the save did to the ICL pool, when reported.
+    let iclMsg = '';
+    if (data.icl_add_result === 'updated') {
+        iclMsg = ` + updated ICL v${this.state.icl_pool.version}`;
+    } else if (data.icl_add_result === 'inserted') {
+        iclMsg = ` + added to ICL v${this.state.icl_pool.version}`;
+    } else if (data.icl_add_result === 'unchanged') {
+        iclMsg = ` + ICL unchanged`;
+    }
+    // auto-advance
+    if (this.editor.autoAdvance) {
         const next = this.findNextDisagreement(sidx, tidx);
         if (next) {
+            this.openTokenEditor(next.s, next.t);
+            this.toast(
+                propagatedCount > 0
+                    ? `✓ Saved + propagated to ${propagatedCount} other "${surface}"${iclMsg}.`
+                    : `✓ Saved${iclMsg}.`,
+                'ok'
+            );
+            return;
         }
+    }
+    // No further disagreement (or auto-advance off): close the editor.
+    this.closeModal();
+    this.toast(
+        propagatedCount > 0
+            ? `✓ Saved + propagated to ${propagatedCount} other "${surface}"${iclMsg}.`
+            : `✓ Saved${iclMsg}.`,
+        'ok'
+    );
+},
+        findNextDisagreement(sidx, tidx) {
+            const sents = this.state.sentences;
+            // search rest of current sentence
+            const sent = sents[sidx];
+            const more = (sent.disagreements || []).filter(d => d.token_idx > tidx).sort((a, b) => a.token_idx - b.token_idx);
+            if (more.length > 0) return {s: sidx, t: more[0].token_idx};
+            // next sentences
+            for (let i = sidx + 1; i < sents.length; i++) {
+                const ds = sents[i].disagreements || [];
+                if (ds.length > 0) {
+                    const t = ds.sort((a, b) => a.token_idx - b.token_idx)[0].token_idx;
+                    return {s: i, t};
+                }
+            }
+            return null;
+        },
+        moveToken(delta) {
+            const sent = this.state.sentences[this.editor.sidx];
+            const next = this.editor.tidx + delta;
+            if (next < 0 || next >= sent.tokens.length) return;
+            this.openTokenEditor(this.editor.sidx, next);
+        },
+        // ----------- selection / bulk -----------
+        toggleSelectionIdx(sidx, tidx) {
+            const k = `${sidx}:${tidx}`;
+            if (this.selection.has(k)) this.selection.delete(k);
+            else this.selection.add(k);
+            // alpine reactivity: replace Set
+            this.selection = new Set(this.selection);
+        },
+        clearSelection() {
+            this.selection = new Set();
+        },
+        bulkSelectedField() {
+            return this.schemaFields.find(f => f.name === this.bulkEditor.field);
+        },
+        async applyBulk() {
+            const bySent = {};
+            for (const k of this.selection) {
+                const [s, t] = k.split(':').map(Number);
+                if (!bySent[s]) bySent[s] = [];
+                bySent[s].push(t);
+            }
+            for (const [s, idxs] of Object.entries(bySent)) {
+                const r = await fetch(`/api/sentence/${s}/bulk`, {
+                    method: 'POST', headers: {'Content-Type': 'application/json'}, body: JSON.stringify({
+                        token_idxs: idxs, field: this.bulkEditor.field, value: this.bulkEditor.value,
+                    })
+                });
+                if (r.ok) this.replaceSentence(Number(s), await r.json());
+            }
+            this.clearSelection();
+            this.closeModal();
+            this.toast('Bulk applied.', 'ok');
+        },
+        // ----------- context menu -----------
+        openTokenContext(ev, sidx, tidx) {
+            this.ctxMenu = {open: true, x: ev.clientX, y: ev.clientY, s: sidx, t: tidx};
+        },
+        // ----------- modals -----------
+        closeModal() {
+            this.modal = null;
+            this.$nextTick(() => {
+                this.editor.sidx = null;
+                this.editor.tidx = null;
+                this.editor.tok = null;
+                this.editor.original = null;
+                this.editor.perModel = {};
+                this.editor.disagreementCells = [];
+            });
+        },
+        // ----------- keyboard -----------
+        // Keyboard dispatcher with three modes, checked in this order:
+        //   1. token editor open: Escape, Enter, arrows and digits 1-9;
+        //   2. any other modal open: Escape only;
+        //   3. no modal: j/k, e/Enter, x, r and Escape, ignored while typing
+        //      in an INPUT or TEXTAREA.
+        globalKey(e) {
+            // editor-modal: route to editor keys
+            if (this.modal === 'token' && this.editor.tok) {
+                if (e.key === 'Escape') {
+                    this.closeModal();
+                    e.preventDefault();
+                    return;
+                }
+                // Enter saves unless the key was typed inside a text input.
+                if (e.key === 'Enter' && !(e.target.tagName === 'INPUT' || e.target.tagName === 'TEXTAREA')) {
+                    this.saveToken();
+                    e.preventDefault();
+                    return;
+                }
+                // Arrows step to the previous / next token of the sentence.
+                if (e.key === 'ArrowLeft') {
+                    this.moveToken(-1);
+                    e.preventDefault();
+                    return;
+                }
+                if (e.key === 'ArrowRight') {
+                    this.moveToken(1);
+                    e.preventDefault();
+                    return;
+                }
+                // 1-9 → assign primary enum
+                const num = parseInt(e.key);
+                if (!isNaN(num) && num >= 1 && num <= 9) {
+                    const enums = this.schemaFields.filter(f => f.type === 'enum' && f.name !== 'confidence');
+                    if (enums.length > 0) {
+                        const f = enums[0];
+                        // Digits index into the filtered list when a filter exists for the field.
+                        const visible = this.editor.filtered[f.name] || f.values;
+                        const v = visible[num - 1];
+                        if (v) {
+                            this.editor.tok[f.name] = v;
+                            e.preventDefault();
+                        }
+                    }
+                }
+                // Every other key is left alone while the token editor is open.
+                return;
+            }
+            // Any other modal: only Escape is handled.
+            if (this.modal) {
+                if (e.key === 'Escape') {
+                    this.closeModal();
+                    e.preventDefault();
+                }
+                return;
+            }
+            // Never hijack keys typed into a text field.
+            if (e.target.tagName === 'INPUT' || e.target.tagName === 'TEXTAREA') return;
+            // global shortcuts
+            if (e.key === 'j') {
+                // j / k: move the token focus forward / backward.
+                this.moveFocus(1);
+                e.preventDefault();
+            } else if (e.key === 'k') {
+                this.moveFocus(-1);
+                e.preventDefault();
+            } else if (e.key === 'e' || e.key === 'Enter') {
+                // e / Enter: open the editor on the focused token.
+                if (this.focus.sent !== null) {
+                    this.openTokenEditor(this.focus.sent, this.focus.tok);
+                    e.preventDefault();
+                }
+            } else if (e.key === 'x') {
+                // x: toggle the focused token in the selection.
+                if (this.focus.sent !== null) {
+                    this.toggleSelectionIdx(this.focus.sent, this.focus.tok);
+                    e.preventDefault();
+                }
+            } else if (e.key === 'r') {
+                // r: annotate the focused sentence.
+                if (this.focus.sent !== null) {
+                    this.annotateOne(this.focus.sent);
+                    e.preventDefault();
+                }
+            } else if (e.key === 'Escape') {
+                this.clearSelection();
+            }
+        },
+        // Intentionally empty key handler: all keyboard handling lives in
+        // globalKey.
+        handleKey(e) { /* main panel passthrough — globalKey handles all */
+        },
+        // Move the token focus by `delta` positions, crossing sentence
+        // boundaries, and scroll the newly focused token into view.
+        // With no current focus, the first token of the first sentence is
+        // focused. Moving before the first sentence or past the last one
+        // leaves the focus unchanged.
+        moveFocus(delta) {
+            const sents = this.state.sentences;
+            if (sents.length === 0) return;
+            if (this.focus.sent === null) {
+                this.focus = {sent: 0, tok: 0};
+                return;
+            }
+            let s = this.focus.sent, t = this.focus.tok + delta;
+            while (s >= 0 && s < sents.length) {
+                if (t < 0) {
+                    // Underflow: continue from the last token of the previous sentence.
+                    s -= 1;
+                    if (s < 0) return;
+                    t = sents[s].tokens.length - 1;
+                    continue;
+                }
+                if (t >= sents[s].tokens.length) {
+                    // Overflow: continue from the first token of the next sentence.
+                    s += 1;
+                    t = 0;
+                    continue;
+                }
+                this.focus = {sent: s, tok: t};
+                // scroll into view
+                this.$nextTick(() => {
+                    const el = document.querySelector(`button.token-base[data-sent="${s}"][data-tok="${t}"]`);
+                    if (el) el.scrollIntoView({block: 'center', behavior: 'smooth'});
+                });
+                return;
+            }
+        },
+        // ----------- toasts -----------
+        toast(msg, kind = 'ok') {
+            const id = this.nextToastId++;
+            this.toasts.push({id, msg, kind});
+            setTimeout(() => {
+                this.toasts = this.toasts.filter(t => t.id !== id);
+            }, 3500);
+        },
+        // ----------- markdown -> html (minimal) -----------
+        markdownToHtml(md) {
+            // very lightweight; safe enough for trusted local content
+            let h = md
+                .replace(/&/g, '&amp;').replace(/</g, '&lt;').replace(/>/g, '&gt;')
+                .replace(/^### (.*)$/gm, '<h3>$1</h3>')
+                .replace(/^## (.*)$/gm, '<h2>$1</h2>')
+                .replace(/^# (.*)$/gm, '<h1>$1</h1>')
+                .replace(/\*\*(.+?)\*\*/g, '<strong>$1</strong>')
+                .replace(/`([^`]+)`/g, '<code>$1</code>')
+                .replace(/^- (.*)$/gm, '<li>$1</li>')
+                .replace(/^\d+\. (.*)$/gm, '<li>$1</li>');
+            h = h.replace(/(<li>.*<\/li>\n?)+/g, m => '<ul>' + m + '</ul>');
+            h = h.split(/\n{2,}/).map(p => /^<[hul]/.test(p) ? p : '<p>' + p.replace(/\n/g, '<br>') + '</p>').join('\n');
+            return h;
+        },
+    };
 }

static/index.html CHANGED Viewed

The diff for this file is too large to render. See raw diff