Watch the model propose, verify, and refine — turn by turn.

Pick any OpenAI-compatible endpoint, point it at one PhysiX system, and step through the episode. Every turn's equation, reward breakdown, latency, and raw completion are dumped below so you can audit exactly what the model said and what the verifier did with it. No LLM-as-judge — rewards come from forward-simulating each proposal and comparing to observation.

{name} {value.toFixed(2)}

= 0.7 ? muted ? "bg-accentBlue/60" : "bg-accentGreen/70" : value >= 0.3 ? "bg-accentAmber/70" : "bg-textMuted/40", )} style={{ width: `${Math.max(0, Math.min(1, value)) * 100}%` }} />

); } // --------------------------------------------------------------------- // Model preset picker — three buttons + one (optional) API-key field. // --------------------------------------------------------------------- // // The picker replaces the old "Endpoint dropdown + freeform model id + // hint paragraph" UI. Users always pick one of three known-good models; // the API-key field only appears when the picked endpoint needs one // (just the HF Router 7B preset today). Only the API key is persisted — // in localStorage, keyed by base URL, via `loadApiKey` / `saveApiKey` — // so a token typed for the 7B preset survives a page reload and isn't // shown when the trained PhysiX preset is selected (it doesn't need // one). interface ModelPresetPickerProps { connection: LlmConnection; onChange: (next: LlmConnection) => void; disabled?: boolean; } function ModelPresetPicker({ connection, onChange, disabled, }: ModelPresetPickerProps): JSX.Element { const selected = presetForConnection(connection) ?? MODEL_PRESETS[0]!; const endpoint = findEndpoint(selected.connection.endpointId); const needsKey = endpoint.needsKey; const [revealKey, setRevealKey] = useState(false); // Hydrate the API key from per-URL storage whenever the preset (and // therefore base URL) changes. useEffect(() => { if (!connection.baseUrl) return; const stored = loadApiKey(connection.baseUrl); if (stored && stored !== connection.apiKey) { onChange({ ...connection, apiKey: stored }); } // eslint-disable-next-line react-hooks/exhaustive-deps }, [connection.baseUrl]); function selectPreset(preset: ModelPreset): void { onChange({ ...preset.connection, apiKey: loadApiKey(preset.connection.baseUrl), }); } function setApiKey(key: string): void { saveApiKey(connection.baseUrl, key); onChange({ ...connection, apiKey: key }); } return (

Pick a model

Three known-good options — the trained PhysiX-3B, its Qwen 3B base, and a Qwen 7B baseline. No URLs to type, no model ids to paste.

{MODEL_PRESETS.map((preset) => ( selectPreset(preset)} /> ))}

{needsKey ? ( HF token (required) setApiKey(e.target.value)} disabled={disabled} placeholder="hf_..." className="w-full rounded-lg border border-border bg-surfaceMuted px-3 py-2 font-mono text-xs text-textPrimary outline-none transition focus:border-textMuted disabled:opacity-50" /> Get one at{" "}


              huggingface.co/settings/tokens

{" "} with the "Make calls to Inference Providers" permission. Saved per endpoint in your browser. ) : null} {/* Live banner only when the picked preset hits the GPU Space. */} {selected.connection.endpointId === "physix" ? ( ) : null}

); } interface PresetCardProps { preset: ModelPreset; selected: boolean; disabled: boolean; onSelect: () => void; } function PresetCard({ preset, selected, disabled, onSelect, }: PresetCardProps): JSX.Element { return ( ); } function ErrorRow({ message, onDismiss, }: { message: string; onDismiss: () => void; }): JSX.Element { return (

{message}

); } function RunPlaceholder({ status }: { status: RunnerStatus }): JSX.Element { if (status === "starting") { return (

); } return (

Configure a connection above and press Run to start an episode.

); } // --------------------------------------------------------------------------- function Field({ label, children, }: { label: string; children: React.ReactNode; }): JSX.Element { return ( {label} {children} ); } function prettySystemId(id: string): string { return id.replace(/_/g, " "); }

Watch the model propose, verify, and refine — turn by turn.

Observed vs predicted —{" "} {primaryVariable}(t)

Transcript — every turn