Spaces:

anugrah55
/

cernenv

Sleeping

App Files Files Community

anugrah55 commited on 12 days ago

Commit

7103888

verified ·

1 Parent(s): 2b0bffa

Update CERNenv Space

Browse files

Files changed (2) hide show

server/app.py +105 -3
space/training/app.py +22 -22

server/app.py CHANGED Viewed

@@ -1,16 +1,107 @@
-"""FastAPI app exposing ``CERNCollisionEnvironment`` over the OpenEnv HTTP API."""
 from __future__ import annotations
 import os
 from typing import Optional
 from openenv.core.env_server import create_fastapi_app
 from models import CollisionObservation, ExperimentAction
 from server.environment import CERNCollisionEnvironment
 def make_env_factory(
     max_steps: int,
     default_difficulty: Optional[str],
@@ -29,9 +120,20 @@ def build_app(
     max_steps: int = 40,
     default_difficulty: Optional[str] = None,
 ):
-    """Construct the FastAPI app with a per-session environment factory."""
     factory = make_env_factory(max_steps=max_steps, default_difficulty=default_difficulty)
-    return create_fastapi_app(factory, ExperimentAction, CollisionObservation)
 app = build_app(

+"""FastAPI app exposing ``CERNCollisionEnvironment`` over the OpenEnv HTTP API.
+We delegate the standard OpenEnv routes (``/reset``, ``/step``, ``/state``,
+``/schema``, ``/health``, ``/mcp``) to ``create_fastapi_app`` and add a
+human-friendly landing page at ``/`` so the Hugging Face Space preview
+shows the project description instead of a 404.
+"""
 from __future__ import annotations
 import os
 from typing import Optional
+from fastapi.responses import HTMLResponse
 from openenv.core.env_server import create_fastapi_app
 from models import CollisionObservation, ExperimentAction
 from server.environment import CERNCollisionEnvironment
+_LANDING_PAGE = """\
+<!doctype html>
+<html lang=en>
+<head>
+  <meta charset=utf-8>
+  <title>CERNenv — LHC Discovery RL Environment</title>
+  <meta name=viewport content="width=device-width,initial-scale=1">
+  <style>
+    body { font-family: ui-sans-serif, system-ui, -apple-system, sans-serif;
+           margin: 2rem auto; max-width: 780px; color:#111; padding: 0 1rem; line-height:1.5 }
+    h1 { margin-bottom: .25rem }
+    h2 { margin-top: 2rem; border-bottom: 1px solid #eee; padding-bottom: .25rem }
+    code { background:#f4f4f4; padding:.05rem .35rem; border-radius:4px; font-size:.95em }
+    pre  { background:#0e1116; color:#e6edf3; padding:1rem; border-radius:6px; overflow-x:auto }
+    pre code { background:transparent; color:inherit; padding:0 }
+    .pill { display:inline-block; padding:.1rem .55rem; border-radius:999px;
+            background:#e8f0ff; color:#1d4ed8; font-size:.85em; margin-right:.25rem }
+    .muted { color:#666 }
+    a { color:#1d4ed8 }
+    table { border-collapse:collapse; margin: .5rem 0 }
+    th,td { text-align:left; padding:.25rem .9rem .25rem 0; vertical-align: top }
+    th { color:#444; font-weight:600 }
+  </style>
+</head>
+<body>
+  <h1>⚛️ CERNenv</h1>
+  <p class=muted>An LHC (Large Hadron Collider) particle-discovery RL environment for autonomous physicist agents — built for the Meta OpenEnv Hackathon.</p>
+  <p>
+    <span class=pill>OpenEnv</span>
+    <span class=pill>POMDP</span>
+    <span class=pill>16 action types</span>
+    <span class=pill>3 difficulty levels</span>
+    <span class=pill>HTTP + WebSocket</span>
+  </p>
+  <h2>What this is</h2>
+  <p>
+    A Large Language Model (LLM) agent plays a high-energy physicist running an
+    analysis at the LHC. Each step it picks one structured action — configure
+    the beam, allocate luminosity, set a trigger, collect collisions, fit a
+    resonance, estimate significance, submit a discovery claim, and so on —
+    and receives a noisy detector-style observation. The latent particle
+    (mass, decay channel, branching ratios, width) is hidden ground truth.
+    Reward decomposes into per-step shaping + a dominant terminal calibration
+    against the truth particle.
+  </p>
+  <h2>API</h2>
+  <table>
+    <tr><th><code>GET  /health</code></th><td>liveness probe</td></tr>
+    <tr><th><code>GET  /schema</code></th><td>JSON schemas for actions, observations, state</td></tr>
+    <tr><th><code>POST /reset</code></th><td>start a new episode (e.g. <code>{"seed": 7, "scenario": "easy_diphoton_160"}</code>)</td></tr>
+    <tr><th><code>POST /step</code></th><td>execute one action (<code>{"action": {"action_type": ..., "parameters": {...}, "justification": "..."}}</code>)</td></tr>
+    <tr><th><code>GET  /state</code></th><td>current public state snapshot</td></tr>
+    <tr><th><code>GET  /docs</code></th><td>interactive Swagger UI</td></tr>
+    <tr><th><code>GET  /metadata</code></th><td>environment metadata</td></tr>
+  </table>
+  <h2>Quickstart</h2>
+  <pre><code># reset
+curl -X POST $URL/reset \\
+  -H 'Content-Type: application/json' \\
+  -d '{"seed": 7, "scenario": "easy_diphoton_160"}'
+# step
+curl -X POST $URL/step \\
+  -H 'Content-Type: application/json' \\
+  -d '{"action": {"action_type": "configure_beam",
+                 "parameters": {"sqrt_s_tev": 13.0},
+                 "justification": "set 13 TeV"}}'</code></pre>
+  <h2>Companion Spaces</h2>
+  <ul>
+    <li>📓 Trainer (Unsloth + LoRA + GRPO on A100): <a href="https://huggingface.co/spaces/anugrah55/cernenv-trainer">anugrah55/cernenv-trainer</a></li>
+    <li>🎯 Trained adapters (LoRA): <a href="https://huggingface.co/anugrah55/cernenv-grpo-qwen2.5-3b">anugrah55/cernenv-grpo-qwen2.5-3b</a></li>
+  </ul>
+  <p class=muted style="margin-top:2rem">CERNenv · OpenEnv-compatible · BSD-3-Clause</p>
+</body>
+</html>
+"""
 def make_env_factory(
     max_steps: int,
     default_difficulty: Optional[str],
     max_steps: int = 40,
     default_difficulty: Optional[str] = None,
 ):
+    """Construct the FastAPI app with a per-session environment factory.
+    The OpenEnv-provided routes (`/reset`, `/step`, `/state`, `/schema`,
+    `/health`, `/mcp`) come from ``create_fastapi_app``. We then mount a
+    friendly landing page at ``/`` so the Space preview is informative.
+    """
     factory = make_env_factory(max_steps=max_steps, default_difficulty=default_difficulty)
+    fa_app = create_fastapi_app(factory, ExperimentAction, CollisionObservation)
+    @fa_app.get("/", response_class=HTMLResponse, include_in_schema=False)
+    def landing() -> HTMLResponse:  # pragma: no cover - trivial
+        return HTMLResponse(_LANDING_PAGE)
+    return fa_app
 app = build_app(

space/training/app.py CHANGED Viewed

@@ -297,17 +297,17 @@ _HTML = """\
   <meta charset=utf-8>
   <title>CERNenv Trainer</title>
   <style>
-    body {{ font-family: ui-sans-serif, system-ui, sans-serif; margin: 2rem auto; max-width: 760px; color:#111 }}
-    h1 {{ margin-bottom: 0 }}
-    .muted {{ color:#666 }}
-    pre {{ background:#0e1116; color:#e6edf3; padding:1rem; border-radius:6px; overflow-x:auto; max-height:50vh }}
-    button {{ font-size:1rem; padding:.6rem 1rem; border-radius:6px; border:1px solid #888; background:#fff; cursor:pointer }}
-    .pill {{ display:inline-block; padding:.1rem .5rem; border-radius:999px; background:#eef; color:#225 }}
-    .ok {{ background:#dfd; color:#272 }}
-    .fail {{ background:#fdd; color:#822 }}
-    .run {{ background:#fdf6d8; color:#774 }}
-    table {{ border-collapse:collapse; }}
-    td {{ padding:.2rem .8rem .2rem 0; }}
   </style>
 </head>
 <body>
@@ -326,31 +326,31 @@ _HTML = """\
   <pre id=logs>loading…</pre>
 <script>
-async function refresh() {{
   const s = await fetch('/status').then(r => r.json());
   const pill = document.getElementById('status');
   pill.textContent = s.status;
-  pill.className = 'pill ' + ({{idle:'',running:'run',finished:'ok',failed:'fail'}}[s.status] || '');
   const meta = document.getElementById('meta');
   meta.innerHTML = '';
-  for (const [k, v] of Object.entries({{
     started_at: s.started_at, finished_at: s.finished_at, error: s.last_error,
-    ...(s.last_config || {{}}),
-  }})) {{
     if (v == null || v === '') continue;
     const tr = document.createElement('tr');
-    tr.innerHTML = `<td><b>${{k}}</b></td><td><code>${{v}}</code></td>`;
     meta.appendChild(tr);
-  }}
   const logs = await fetch('/logs?tail=200').then(r => r.text());
   document.getElementById('logs').textContent = logs || '(no logs yet)';
-}}
-async function startRun() {{
-  await fetch('/train', {{method:'POST'}});
   setTimeout(refresh, 500);
-}}
 refresh();
 setInterval(refresh, 5000);
 </script>

   <meta charset=utf-8>
   <title>CERNenv Trainer</title>
   <style>
+    body { font-family: ui-sans-serif, system-ui, sans-serif; margin: 2rem auto; max-width: 760px; color:#111 }
+    h1 { margin-bottom: 0 }
+    .muted { color:#666 }
+    pre { background:#0e1116; color:#e6edf3; padding:1rem; border-radius:6px; overflow-x:auto; max-height:50vh }
+    button { font-size:1rem; padding:.6rem 1rem; border-radius:6px; border:1px solid #888; background:#fff; cursor:pointer }
+    .pill { display:inline-block; padding:.1rem .5rem; border-radius:999px; background:#eef; color:#225 }
+    .ok { background:#dfd; color:#272 }
+    .fail { background:#fdd; color:#822 }
+    .run { background:#fdf6d8; color:#774 }
+    table { border-collapse:collapse; }
+    td { padding:.2rem .8rem .2rem 0; }
   </style>
 </head>
 <body>
   <pre id=logs>loading…</pre>
 <script>
+async function refresh() {
   const s = await fetch('/status').then(r => r.json());
   const pill = document.getElementById('status');
   pill.textContent = s.status;
+  pill.className = 'pill ' + ({idle:'',running:'run',finished:'ok',failed:'fail'}[s.status] || '');
   const meta = document.getElementById('meta');
   meta.innerHTML = '';
+  for (const [k, v] of Object.entries({
     started_at: s.started_at, finished_at: s.finished_at, error: s.last_error,
+    ...(s.last_config || {}),
+  })) {
     if (v == null || v === '') continue;
     const tr = document.createElement('tr');
+    tr.innerHTML = `<td><b>${k}</b></td><td><code>${v}</code></td>`;
     meta.appendChild(tr);
+  }
   const logs = await fetch('/logs?tail=200').then(r => r.text());
   document.getElementById('logs').textContent = logs || '(no logs yet)';
+}
+async function startRun() {
+  await fetch('/train', {method:'POST'});
   setTimeout(refresh, 500);
+}
 refresh();
 setInterval(refresh, 5000);
 </script>