Spaces:
Running
Running
| <!doctype html> | |
| <html lang="en"> | |
| <head> | |
| <meta charset="utf-8"> | |
| <!-- Without a viewport declaration, mobile browsers lay the page out at a desktop width and scale it down, which defeats the fluid clamp()/auto-fit sizing used in the stylesheet. Zoom is deliberately left unrestricted. --> | |
| <meta name="viewport" content="width=device-width, initial-scale=1"> | |
| <title>Qwopus3.6-27B v1-preview — Evaluation Suite</title> | |
| <style> | |
| /* ---- Page foundation ---- */ | |
| /* Opt the whole document into the dark colour scheme. */ | |
| :root { | |
|   color-scheme: dark; | |
| } | |
| /* Padding and borders count towards every element's declared size. */ | |
| * { | |
|   box-sizing: border-box; | |
| } | |
| /* Full-height dark canvas with a purple glow fading in from the top edge. */ | |
| body { | |
|   margin: 0; | |
|   padding: 4rem 1.5rem 6rem; | |
|   min-height: 100vh; | |
|   font-family: -apple-system, BlinkMacSystemFont, "SF Pro Text", "Inter", system-ui, sans-serif; | |
|   line-height: 1.55; | |
|   color: #e9ecf4; | |
|   background: radial-gradient(ellipse at top, #1a1025 0%, #07080d 60%); | |
| } | |
| /* Single centred content column. */ | |
| .wrap { | |
|   margin: 0 auto; | |
|   max-width: 920px; | |
| } | |
| /* Applies to every <header> element; the page markup uses exactly one. */ | |
| header { | |
|   margin-bottom: 3rem; | |
| } | |
| /* ---- Header typography ---- */ | |
| /* Small uppercase label shown above the page title. */ | |
| .eyebrow { | |
|   color: #c4a0ff; | |
|   font-size: 0.78rem; | |
|   font-weight: 600; | |
|   letter-spacing: 0.22em; | |
|   text-transform: uppercase; | |
| } | |
| /* Page title. The solid colour is what renders whenever the gradient-text effect below is not applied. */ | |
| h1 { | |
|   font-size: clamp(1.8rem, 4vw, 2.6rem); | |
|   font-weight: 700; | |
|   letter-spacing: -0.025em; | |
|   margin: 0.35rem 0 0.4rem; | |
|   color: #ffffff; | |
| } | |
| /* Gradient-filled title. A transparent glyph fill is only safe when the background can be clipped to the glyph shapes; without that the title would be invisible, so the whole effect is gated on support for background-clip: text. */ | |
| @supports ((-webkit-background-clip: text) or (background-clip: text)) { | |
|   h1 { | |
|     background: linear-gradient(135deg, #ffffff 0%, #d8b4fe 100%); | |
|     -webkit-background-clip: text; | |
|     background-clip: text; | |
|     -webkit-text-fill-color: transparent; | |
|   } | |
| } | |
| /* Author / attribution line under the title. */ | |
| .byline { | |
|   color: #c4a0ff; | |
|   font-size: 0.92rem; | |
|   margin: 0.1rem 0 0.9rem; | |
| } | |
| /* Byline links keep the surrounding colour and use a faint underline that brightens on hover. */ | |
| .byline a { | |
|   color: inherit; | |
|   text-decoration: none; | |
|   border-bottom: 1px solid rgba(196,160,255,0.25); | |
| } | |
| .byline a:hover { | |
|   border-bottom-color: #c4a0ff; | |
| } | |
| /* Intro paragraph, capped at a readable measure. */ | |
| .sub { | |
|   color: #9aa3bb; | |
|   max-width: 64ch; | |
| } | |
| /* ---- Call-to-action row ---- */ | |
| /* Wrapping flex row that holds the report / compare / follow buttons. */ | |
| .cta-row { | |
|   display: flex; | |
|   flex-wrap: wrap; | |
|   align-items: center; | |
|   gap: 0.7rem; | |
|   margin-top: 1.5rem; | |
| } | |
| /* Declarations common to all three button-styled links. */ | |
| .report-link, | |
| .compare-link, | |
| .follow-link { | |
|   display: inline-flex; | |
|   align-items: center; | |
|   border-radius: 10px; | |
|   text-decoration: none; | |
|   font-weight: 600; | |
|   font-size: 0.95rem; | |
| } | |
| /* Primary button: gradient fill, slightly wider horizontal padding. */ | |
| .report-link { | |
|   gap: 0.5rem; | |
|   padding: 0.85rem 1.3rem; | |
|   background: linear-gradient(135deg, #a855f7 0%, #ec4899 100%); | |
|   color: #fff; | |
|   transition: transform 0.2s ease, filter 0.2s ease; | |
| } | |
| .report-link:hover { | |
|   transform: translateY(-1px); | |
|   filter: brightness(1.1); | |
| } | |
| /* Trailing arrow is generated content, so it is not part of the link text in the markup. */ | |
| .report-link::after { | |
|   content: " →"; | |
| } | |
| /* Secondary buttons: translucent fill with a hairline border. */ | |
| .compare-link, | |
| .follow-link { | |
|   padding: 0.85rem 1.2rem; | |
|   border: 1px solid rgba(255,255,255,0.1); | |
|   color: #e9ecf4; | |
|   transition: transform 0.2s ease, background 0.2s ease, border-color 0.2s ease; | |
| } | |
| /* The two secondary variants differ only in icon gap and fill opacity. */ | |
| .compare-link { | |
|   gap: 0.5rem; | |
|   background: rgba(255,255,255,0.05); | |
| } | |
| .follow-link { | |
|   gap: 0.55rem; | |
|   background: rgba(255,255,255,0.055); | |
| } | |
| .compare-link:hover, | |
| .follow-link:hover { | |
|   transform: translateY(-1px); | |
|   background: rgba(255,255,255,0.09); | |
|   border-color: rgba(255,255,255,0.2); | |
| } | |
| /* Sizes the inline icon inside the follow button. */ | |
| .follow-link svg { | |
|   width: 15px; | |
|   height: 15px; | |
| } | |
| /* ---- Headline statistics strip ---- */ | |
| /* Bordered panel whose cells auto-fit into as many 150px-minimum columns as the width allows. */ | |
| .stats { | |
|   display: grid; | |
|   grid-template-columns: repeat(auto-fit, minmax(150px, 1fr)); | |
|   gap: 1rem; | |
|   margin: 2rem 0 3rem; | |
|   padding: 1.25rem; | |
|   border: 1px solid rgba(255,255,255,0.06); | |
|   border-radius: 14px; | |
|   background: rgba(255,255,255,0.03); | |
| } | |
| /* The large figure in each cell. */ | |
| .stat b { | |
|   display:block; | |
|   color: #ffffff; | |
|   font-size: 1.6rem; | |
|   font-weight: 700; | |
|   letter-spacing: -0.02em; | |
| } | |
| /* Caption beneath the figure. */ | |
| .stat span { | |
|   color: #7e8aa5; | |
|   font-size: 0.78rem; | |
|   letter-spacing: 0.12em; | |
|   text-transform: uppercase; | |
| } | |
| /* Change-versus-baseline line. In the markup it is also a <span>, so the uppercase and letter-spacing above still apply; only the properties listed here are overridden. */ | |
| .stat .delta { | |
|   display: block; | |
|   margin-top: 0.25rem; | |
|   color: #86efac; | |
|   font-size: 0.85rem; | |
|   font-weight: 600; | |
| } | |
| /* ---- Section headings ---- */ | |
| /* Small uppercase heading with a hairline rule beneath it. */ | |
| h2 { | |
|   margin: 3rem 0 1rem; | |
|   padding-bottom: 0.6rem; | |
|   border-bottom: 1px solid rgba(255,255,255,0.07); | |
|   color: #9fa7c0; | |
|   font-size: 0.85rem; | |
|   font-weight: 600; | |
|   letter-spacing: 0.14em; | |
|   text-transform: uppercase; | |
| } | |
| /* ---- Result cards ---- */ | |
| /* Card grid: as many 280px-minimum columns as fit (auto-fill keeps empty tracks, so a short row does not stretch). */ | |
| .grid { | |
|   display: grid; | |
|   grid-template-columns: repeat(auto-fill, minmax(280px, 1fr)); | |
|   gap: 0.9rem; | |
| } | |
| /* Each card is a single block-level link. */ | |
| .card { | |
|   display: block; | |
|   padding: 1.1rem 1.2rem; | |
|   border: 1px solid rgba(255,255,255,0.07); | |
|   border-radius: 11px; | |
|   background: rgba(255,255,255,0.035); | |
|   color: inherit; | |
|   text-decoration: none; | |
|   transition: transform 0.22s ease, border-color 0.22s ease, background 0.22s ease; | |
| } | |
| /* Hover: lift slightly and tint border and fill purple. */ | |
| .card:hover { | |
|   transform: translateY(-2px); | |
|   border-color: rgba(216, 180, 254, 0.45); | |
|   background: rgba(216, 180, 254, 0.07); | |
| } | |
| /* Card title. */ | |
| .card strong { | |
|   display: block; | |
|   margin-bottom: 0.25rem; | |
|   color: #f3f5fa; | |
|   font-size: 0.98rem; | |
|   font-weight: 600; | |
| } | |
| /* Card subtitle. */ | |
| .card span { | |
|   color: #8b93ab; | |
|   font-size: 0.82rem; | |
| } | |
| /* Monospace line for size / token / timing figures. */ | |
| .meta { | |
|   margin-top: 0.6rem; | |
|   color: #6c7693; | |
|   font-family: ui-monospace, SFMono-Regular, Menlo, Consolas, monospace; | |
|   font-size: 0.72rem; | |
| } | |
| /* ---- Page footer ---- */ | |
| footer { | |
|   margin-top: 5rem; | |
|   color: #5a6380; | |
|   font-size: 0.82rem; | |
|   text-align: center; | |
| } | |
| /* ---- Early-preview notice ---- */ | |
| /* Amber-to-pink tinted callout; the icon and the text sit side by side, aligned to the top. */ | |
| .preview-banner { | |
|   display: flex; | |
|   align-items: flex-start; | |
|   gap: 0.9rem; | |
|   margin: 2rem 0 0; | |
|   padding: 1.1rem 1.3rem; | |
|   border: 1px solid rgba(251,191,36,0.28); | |
|   border-radius: 12px; | |
|   background: linear-gradient(135deg, rgba(251,191,36,0.09), rgba(236,72,153,0.07)); | |
|   color: #e9ecf4; | |
|   font-size: 0.92rem; | |
|   line-height: 1.55; | |
| } | |
| /* Fixed-size round badge; grid + place-items centres the glyph inside it. */ | |
| .preview-banner .icon { | |
|   display: grid; | |
|   place-items: center; | |
|   flex-shrink: 0; | |
|   width: 28px; | |
|   height: 28px; | |
|   border-radius: 50%; | |
|   background: rgba(251,191,36,0.18); | |
|   color: #fbbf24; | |
|   font-size: 0.95rem; | |
|   font-weight: 700; | |
| } | |
| /* Banner headline, placed on its own line above the body text. */ | |
| .preview-banner .pv-title { | |
|   display: block; | |
|   margin-bottom: 0.2rem; | |
|   color: #fde68a; | |
|   font-weight: 700; | |
|   letter-spacing: 0.02em; | |
| } | |
| /* Links inside the banner match the headline colour and use a soft underline. */ | |
| .preview-banner a { | |
|   color: #fde68a; | |
|   text-decoration: none; | |
|   border-bottom: 1px solid rgba(253,230,138,0.35); | |
| } | |
| </style> | |
| </head> | |
| <body> | |
| <div class="wrap"> | |
| <!-- Page header: title, attribution, run summary, early-preview notice and the call-to-action links. --> | |
| <header> | |
|   <div class="eyebrow">Early-Preview Fine-tune · Round 2</div> | |
|   <h1>Qwopus3.6-27B — v1-preview</h1> | |
|   <p class="byline">by <a href="https://x.com/KyleHessling1" target="_blank" rel="noopener">Kyle Hessling</a> · built on <a href="https://huggingface.co/Jackrong/Qwopus3.6-27B-v1-preview-GGUF" target="_blank" rel="noopener">Jackrong's fine-tune</a></p> | |
|   <p class="sub">Same 16-prompt suite as the Qwen3.6-27B base eval — 5 agentic, 5 web-design, 6 canvas/WebGL. Q4_K_M on a single RTX 5090 via llama.cpp. Byline metrics: <b>62.3 tok/s avg</b>, <b>87.4 k tokens generated</b>, <b>23.4 min runtime</b>.</p> | |
|   <div class="preview-banner"> | |
|     <!-- The "!" badge is purely decorative; the headline next to it carries the warning, so the glyph is hidden from assistive technology. --> | |
|     <div class="icon" aria-hidden="true">!</div> | |
|     <div> | |
|       <span class="pv-title">This is an early preview — not the final Qwopus 3.6</span> | |
|       The v1-preview weights come from a small ~12 K-example training run. I'm currently working with <a href="https://huggingface.co/Jackrong" target="_blank" rel="noopener">Jackrong</a> to land more compute for a full fine-tune pass that'll be orders of magnitude larger and cleaner. Numbers and behaviour on this page will change when the full model ships. | |
|     </div> | |
|   </div> | |
|   <div class="cta-row"> | |
|     <a href="report.html" class="report-link">Read the full report</a> | |
|     <!-- No inline style here: the compare-link class already supplies the inline-flex layout, centring and icon gap. --> | |
|     <a href="report.pdf" target="_blank" rel="noopener" class="compare-link"> | |
|       <svg viewBox="0 0 24 24" width="15" height="15" fill="currentColor" aria-hidden="true"><path d="M14 2H6a2 2 0 0 0-2 2v16a2 2 0 0 0 2 2h12a2 2 0 0 0 2-2V8zM13 9V3.5L18.5 9z"/></svg> | |
|       PDF version | |
|     </a> | |
|     <a href="https://huggingface.co/spaces/KyleHessling1/qwen36-eval" target="_blank" rel="noopener" class="compare-link">Compare · Qwen3.6 base eval</a> | |
|     <a href="https://x.com/KyleHessling1" target="_blank" rel="noopener" class="follow-link"> | |
|       <svg viewBox="0 0 24 24" fill="currentColor" aria-hidden="true"><path d="M18.244 2.25h3.308l-7.227 8.26 8.502 11.24H16.17l-5.214-6.817L4.99 21.75H1.68l7.73-8.835L1.254 2.25H8.08l4.713 6.231zm-1.161 17.52h1.833L7.084 4.126H5.117z"/></svg> | |
|       Follow @KyleHessling1 | |
|     </a> | |
|   </div> | |
| </header> | |
| <!-- Primary content. Wrapping it in <main> gives assistive technology a landmark to jump to, past the header links. --> | |
| <main> | |
|   <!-- Headline figures for the whole run. --> | |
|   <div class="stats"> | |
|     <div class="stat"><b>62.3</b><span>avg tok/s</span><span class="delta">+12.7% vs base</span></div> | |
|     <div class="stat"><b>16</b><span>runs</span></div> | |
|     <div class="stat"><b>87,394</b><span>completion tokens</span></div> | |
|     <div class="stat"><b>~20 GB</b><span>VRAM used</span></div> | |
|     <div class="stat"><b>65K</b><span>context window</span></div> | |
|   </div> | |
|   <!-- Each card links to the raw model output for one prompt; the meta line gives file size, completion tokens and generation time. --> | |
|   <h2>Web design · open to preview</h2> | |
|   <div class="grid"> | |
|     <a class="card" href="design_saas_landing.html"><strong>SaaS landing page</strong><span>Prism — AI observability</span><div class="meta">36.7 KB · 9,961 tok · 160 s</div></a> | |
|     <a class="card" href="design_analytics_dashboard.html"><strong>Analytics dashboard</strong><span>Light theme, emerald accent</span><div class="meta">37.4 KB · 13,190 tok · 213 s</div></a> | |
|     <a class="card" href="design_designer_portfolio.html"><strong>Designer portfolio</strong><span>Maya Chen — kinetic typography</span><div class="meta">23.1 KB · 7,356 tok · 118 s</div></a> | |
|     <a class="card" href="design_pricing_page.html"><strong>Pricing page</strong><span>3 tiers + animated toggle + FAQ</span><div class="meta">24.3 KB · 8,061 tok · 129 s</div></a> | |
|     <a class="card" href="design_mobile_app_marketing.html"><strong>Mobile app marketing</strong><span>Stillwater — CSS-only iPhone mock</span><div class="meta">29.3 KB · 8,005 tok · 128 s</div></a> | |
|   </div> | |
|   <!-- NOTE(review): the intro copy says 6 canvas/WebGL prompts and the stats say 16 runs, but only 5 canvas cards (15 cards in total) are linked on this page. Confirm whether one output is missing. --> | |
|   <h2>Canvas / WebGL · creative coding</h2> | |
|   <div class="grid"> | |
|     <a class="card" href="canvas_particle_attractor.html"><strong>Particle attractor</strong><span>3000-particle fluid swarm</span><div class="meta">11.1 KB · 4,249 tok · 68 s</div></a> | |
|     <a class="card" href="canvas_webgl_shader.html"><strong>WebGL Mandelbulb</strong><span>Raymarched fractal shader</span><div class="meta">11.5 KB · 4,364 tok · 70 s</div></a> | |
|     <a class="card" href="canvas_three_scene.html"><strong>Three.js crystal scene</strong><span>Transmissive glass + bloom</span><div class="meta">17.9 KB · 6,375 tok · 102 s</div></a> | |
|     <a class="card" href="canvas_physics_sandbox.html"><strong>Physics sandbox</strong><span>Soft-body collisions, fling mouse</span><div class="meta">15.1 KB · 4,384 tok · 70 s</div></a> | |
|     <a class="card" href="canvas_audio_reactive.html"><strong>Audio-reactive visualizer</strong><span>Mic + oscillator fallback</span><div class="meta">12.0 KB · 3,018 tok · 48 s</div></a> | |
|   </div> | |
|   <h2>Agentic reasoning · text output</h2> | |
|   <div class="grid"> | |
|     <a class="card" href="agentic_multi_step_planning.txt"><strong>Multi-step planning</strong><span>URL shortener deploy plan</span><div class="meta">thinking: 3,158 tok · 50 s</div></a> | |
|     <a class="card" href="agentic_self_critique.txt"><strong>Self-critique loop</strong><span>Palindrome · O(n³) → O(n²)</span><div class="meta">thinking: 1,277 tok · 21 s</div></a> | |
|     <a class="card" href="agentic_code_debug.txt"><strong>Code debug (4 bugs)</strong><span>k-th smallest element</span><div class="meta">thinking: 1,628 tok · 26 s</div></a> | |
|     <a class="card" href="agentic_structured_extraction_nothink.txt"><strong>Structured JSON extraction</strong><span>Calendar + roster from prose</span><div class="meta">no-think rerun · 353 tok</div></a> | |
|     <a class="card" href="agentic_tool_use_json.txt"><strong>Tool-use planning</strong><span>Weather + flights + hotel</span><div class="meta">thinking: 1,174 tok · 19 s</div></a> | |
|   </div> | |
| </main> | |
| <!-- Page footer: names the exact model build and the serving setup used for the runs. --> | |
| <footer> | |
|   Model: | |
|   <code>Jackrong/Qwopus3.6-27B-v1-preview-GGUF — Q4_K_M</code> | |
|   · served via llama.cpp on a single RTX 5090 | |
| </footer> | |
| </div> | |
| </body> | |
| </html> | |