app.py ADDED
@@ -0,0 +1,788 @@
#!/usr/bin/env python3
"""
─────────────────────────────────────────────────────────────────────────────
WorldQuant Alpha Swarm – Gradio UI
Supports: Hugging Face Inference API + Ollama (local)
Features:
  • LLM-driven alpha generation with structured JSON prompting
  • Dropdown selectors for all WQ data fields & operators
  • Real-time backtest evaluation on synthetic data
  • Orthogonality check vs existing library
  • Multi-domain swarm mode
─────────────────────────────────────────────────────────────────────────────
"""

import json
import math
import os
import random
import re
import sys
import traceback
from dataclasses import dataclass
from typing import Dict, List, Optional, Set, Tuple

import gradio as gr
import numpy as np
import pandas as pd
from scipy.stats import spearmanr

# ─────────────────────────────────────────────────────────────────────────────
# CONFIG: Model Lists
# ─────────────────────────────────────────────────────────────────────────────

HF_MODELS = [
    "meta-llama/Meta-Llama-3-8B-Instruct",
    "mistralai/Mistral-7B-Instruct-v0.3",
    "Qwen/Qwen2.5-7B-Instruct",
    "deepseek-ai/DeepSeek-R1-Distill-Llama-8B",
    "microsoft/Phi-3-mini-4k-instruct",
    "HuggingFaceH4/zephyr-7b-beta",
]

OLLAMA_MODELS = [
    "llama3.2",
    "deepseek-r1:8b",
    "qwen2.5:7b",
    "mistral",
    "codellama",
    "phi3",
]

# ─────────────────────────────────────────────────────────────────────────────
# CONFIG: WorldQuant Data Fields & Operators
# ─────────────────────────────────────────────────────────────────────────────

WQ_DATA_FIELDS = {
    # Price / Volume
    "open", "high", "low", "close", "volume", "vwap",
    "returns", "returns_open", "intraday_return", "overnight_return",
    "open_close_return", "high_low_range", "close_open_gap",
    "num_trades", "turnover", "turnover_ratio",
    "bid", "ask", "bid_size", "ask_size", "adv20", "adv60",
    # Fundamentals
    "market_cap", "pe_ratio", "pb_ratio", "ps_ratio",
    "ev_ebitda", "ev_sales", "debt_equity", "current_ratio",
    "roe", "roa", "roic", "gross_profit_margin",
    "ebitda", "operating_income", "net_income", "sales", "revenue",
    "total_assets", "total_debt", "cash", "book_value", "equity",
    "liabilities", "assets",
    "eps", "dps", "dividend_yield",
    "revenue_growth", "earnings_growth", "enterprise_value", "cap",
    "gross_income", "gross_income_reported_value",
    # Analyst / Estimates
    "est_eps", "est_revenue", "recommendation_mean",
    "num_analysts", "eps_surprise", "eps_surprise_pct",
    # Options
    "implied_volatility_call_180", "implied_volatility_put_180",
    "iv30", "iv60", "iv90", "put_call_ratio", "option_volume", "open_interest",
    # Alternative
    "realized_vol", "volatility", "skewness", "kurtosis",
}

WQ_OPERATORS = {
    # Cross-section
    "rank", "zscore", "scale", "normalize", "sign", "abs",
    "max", "min", "greater", "less", "if_else", "cond",
    "and", "or", "not",
    "group_neutralize", "group_rank", "group_zscore", "group_normalize",
    # Time-series
    "ts_mean", "ts_std_dev", "ts_variance", "ts_zscore", "ts_rank",
    "ts_min", "ts_max", "ts_delta", "ts_delay", "ts_return",
    "ts_corr", "ts_cov", "ts_sum", "ts_prod", "ts_skew", "ts_kurt",
    "ts_decay_linear", "ts_decay_exp", "ts_argmax", "ts_argmin",
    "ts_ir", "ts_backfill", "ts_sumif", "ts_count",
    # Special
    "trade_when",
}

NEUTRALIZATION_LEVELS = ["subindustry", "industry", "sector", "market", "none"]
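The whitelists above also enable a cheap pre-screen before any expression reaches the evaluator: extract identifiers from a candidate and reject anything outside the two sets. A minimal sketch (the helper name, regex, and subset whitelists below are illustrative, not part of the app):

```python
import re

# Illustrative subsets of the whitelists defined above.
FIELDS = {"close", "volume", "returns"}
OPERATORS = {"rank", "ts_mean", "group_neutralize"}

def uses_only_known_tokens(expr: str) -> bool:
    """Reject expressions that mention an identifier outside the whitelists."""
    tokens = set(re.findall(r"[A-Za-z_][A-Za-z0-9_]*", expr))
    allowed = FIELDS | OPERATORS | {"subindustry"}  # allow a group label too
    return tokens <= allowed

print(uses_only_known_tokens("group_neutralize(rank(ts_mean(returns, 5)), subindustry)"))  # True
print(uses_only_known_tokens("rank(unknown_field)"))  # False
```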

# ─────────────────────────────────────────────────────────────────────────────
# SYNTHETIC DATA GENERATOR (Embedded Anomalies)
# ─────────────────────────────────────────────────────────────────────────────

_DATA_CACHE = {}


def get_synthetic_data(n_stocks: int = 300, n_days: int = 252, seed: int = 2026):
    key = (n_stocks, n_days, seed)
    if key in _DATA_CACHE:
        return _DATA_CACHE[key]

    np.random.seed(seed)
    dates = pd.date_range("2020-01-02", periods=n_days, freq="B")
    stocks = [f"STK_{i:04d}" for i in range(n_stocks)]

    # Persistent characteristics
    liquidity_sens = np.random.beta(2, 5, n_stocks)
    value_score = -np.log(np.random.lognormal(0, 0.4, n_stocks))
    earn_vol = np.random.gamma(2, 0.03, n_stocks)

    # Market factor
    market_ret = np.random.normal(0.0003, 0.012, n_days)
    idio_vol = np.random.uniform(0.015, 0.035, n_stocks)
    beta = np.random.uniform(0.5, 1.5, n_stocks)

    returns = np.random.normal(0, idio_vol, (n_days, n_stocks))
    for t in range(n_days):
        returns[t] += beta * market_ret[t]

    # Embed anomalies
    market_cap = np.random.lognormal(22, 1.2, (n_days, n_stocks))
    market_cap = np.maximum(market_cap, 1e6)
    volume = np.exp(np.random.normal(15, 0.5, (n_days, n_stocks)))

    # ANOMALY 1: Amihud reversal
    for t in range(5, n_days - 1):
        amihud = np.abs(returns[t]) / (market_cap[t] * 1e-6 + 1000)
        amihud_rank = np.argsort(np.argsort(amihud)) / (n_stocks - 1)
        returns[t+1, amihud_rank > 0.80] -= 0.008 * liquidity_sens[amihud_rank > 0.80]
        returns[t+1, amihud_rank < 0.20] += 0.003 * (1 - liquidity_sens[amihud_rank < 0.20])

    # ANOMALY 2: PEAD
    eps_surprise = np.zeros((n_days, n_stocks))
    for s in range(n_stocks):
        earn_dates = np.random.choice(range(20, n_days - 10), size=3, replace=False)
        for ed in earn_dates:
            surprise = np.random.normal(0, earn_vol[s])
            eps_surprise[ed, s] = surprise
            drift = 0.5 * surprise / (earn_vol[s] + 0.001) * 0.004
            for d in range(1, 6):
                if ed + d < n_days:
                    returns[ed + d, s] += drift * (1 - 0.15 * d)

    # ANOMALY 3: Value premium
    for t in range(n_days):
        returns[t] += 0.00008 * value_score

    # ANOMALY 4: VWAP pressure reversal
    close = np.zeros((n_days, n_stocks))
    close[0] = 100.0
    for t in range(1, n_days):
        close[t] = close[t-1] * (1 + returns[t])

    vol_ma20 = pd.DataFrame(volume).rolling(20, min_periods=1).mean().values
    rel_vol = volume / (vol_ma20 + 1)
    vwap = close * (1 + 0.001 * (rel_vol - 1) * np.random.normal(0, 1, (n_days, n_stocks)))

    for t in range(1, n_days - 1):
        vwap_gap = np.abs(vwap[t] - close[t]) / close[t]
        pressure = vwap_gap * rel_vol[t]
        p_rank = np.argsort(np.argsort(pressure)) / (n_stocks - 1)
        returns[t+1, p_rank > 0.90] -= 0.006 * liquidity_sens[p_rank > 0.90]

    # Recalculate close with anomalies
    close = np.zeros((n_days, n_stocks))
    close[0] = 100.0
    for t in range(1, n_days):
        close[t] = close[t-1] * (1 + returns[t])

    high = close * (1 + np.abs(np.random.normal(0, 0.008, close.shape)))
    low = close * (1 - np.abs(np.random.normal(0, 0.008, close.shape)))
    open_p = close * (1 + np.random.normal(0, 0.003, close.shape))

    # Fundamentals
    operating_income = market_cap * np.random.lognormal(-3.0, 0.6, (n_days, n_stocks))
    ebitda = operating_income * np.random.lognormal(0.3, 0.15, (n_days, n_stocks))
    total_debt = market_cap * np.random.lognormal(-1.8, 0.9, (n_days, n_stocks))
    total_assets = market_cap * np.random.lognormal(0.1, 0.4, (n_days, n_stocks))
    cash = total_assets * np.random.uniform(0.03, 0.18, (n_days, n_stocks))
    equity = total_assets * np.random.uniform(0.35, 0.75, (n_days, n_stocks))
    liabilities = total_assets - equity
    enterprise_value = market_cap * np.random.uniform(1.0, 1.6, (n_days, n_stocks))
    sales = market_cap * np.random.lognormal(-1.4, 0.35, (n_days, n_stocks))
    eps = operating_income / (market_cap / 100) * np.random.uniform(0.3, 0.8, (n_days, n_stocks))
    est_eps = eps * (1 + np.random.normal(0, 0.1, (n_days, n_stocks)))
    eps_surprise_pct = eps_surprise / (np.abs(est_eps) + 0.01)
    num_analysts = np.random.poisson(8, (n_days, n_stocks)).astype(float)

    # Options
    iv_call = np.random.uniform(0.18, 0.48, (n_days, n_stocks))
    iv_put = iv_call + np.random.normal(0, 0.025, (n_days, n_stocks))
    put_call_ratio = np.random.lognormal(0, 0.35, (n_days, n_stocks))
    option_volume = volume * np.random.uniform(0.002, 0.04, (n_days, n_stocks))

    realized_vol = pd.DataFrame(returns).rolling(20, min_periods=1).std().values
    realized_vol = np.nan_to_num(realized_vol, nan=0.02)

    def mkdf(arr):
        return pd.DataFrame(arr, index=dates, columns=stocks)

    data = {
        "returns": mkdf(returns),
        "close": mkdf(close),
        "high": mkdf(high),
        "low": mkdf(low),
        "open": mkdf(open_p),
        "volume": mkdf(volume),
        "vwap": mkdf(vwap),
        "market_cap": mkdf(market_cap),
        "cap": mkdf(market_cap),
        "operating_income": mkdf(operating_income),
        "ebitda": mkdf(ebitda),
        "total_debt": mkdf(total_debt),
        "total_assets": mkdf(total_assets),
        "cash": mkdf(cash),
        "equity": mkdf(equity),
        "book_value": mkdf(equity),
        "liabilities": mkdf(liabilities),
        "assets": mkdf(total_assets),
        "enterprise_value": mkdf(enterprise_value),
        "sales": mkdf(sales),
        "revenue": mkdf(sales),
        "eps": mkdf(eps),
        "est_eps": mkdf(est_eps),
        "eps_surprise": mkdf(eps_surprise),
        "eps_surprise_pct": mkdf(eps_surprise_pct),
        "num_analysts": mkdf(num_analysts),
        "implied_volatility_call_180": mkdf(iv_call),
        "implied_volatility_put_180": mkdf(iv_put),
        "put_call_ratio": mkdf(put_call_ratio),
        "option_volume": mkdf(option_volume),
        "realized_vol": mkdf(realized_vol),
        "adv20": mkdf(pd.DataFrame(volume).rolling(20, min_periods=1).mean().values),
        "turnover": mkdf(volume / (market_cap + 1)),
        "turnover_ratio": mkdf(volume / (market_cap + 1)),
        "volatility": mkdf(realized_vol),
        "debt_equity": mkdf(total_debt / (equity + 1)),
        "current_ratio": mkdf(np.random.uniform(0.8, 2.5, (n_days, n_stocks))),
        "roe": mkdf(operating_income / (equity + 1)),
        "roa": mkdf(operating_income / (total_assets + 1)),
        "gross_profit_margin": mkdf(np.random.uniform(0.2, 0.6, (n_days, n_stocks))),
        "pe_ratio": mkdf(np.random.lognormal(2.5, 0.5, (n_days, n_stocks))),
        "pb_ratio": mkdf(close / (equity / (market_cap / 100) + 0.01)),
        "ev_ebitda": mkdf(enterprise_value / (ebitda + 1)),
        "net_income": mkdf(operating_income * np.random.uniform(0.5, 0.9, (n_days, n_stocks))),
        "dividend_yield": mkdf(np.random.uniform(0, 0.05, (n_days, n_stocks))),
        "earnings_growth": mkdf(np.random.normal(0.05, 0.15, (n_days, n_stocks))),
        "revenue_growth": mkdf(np.random.normal(0.05, 0.15, (n_days, n_stocks))),
        "gross_income": mkdf(operating_income * np.random.uniform(1.2, 1.5, (n_days, n_stocks))),
        "gross_income_reported_value": mkdf(operating_income * np.random.uniform(1.2, 1.5, (n_days, n_stocks))),
        "iv30": mkdf(np.random.uniform(0.18, 0.48, (n_days, n_stocks))),
        "iv60": mkdf(np.random.uniform(0.18, 0.48, (n_days, n_stocks))),
        "iv90": mkdf(np.random.uniform(0.18, 0.48, (n_days, n_stocks))),
        "open_interest": mkdf(option_volume * np.random.uniform(5, 20, (n_days, n_stocks))),
        "bid": mkdf(close * (1 - np.random.uniform(0, 0.001, (n_days, n_stocks)))),
        "ask": mkdf(close * (1 + np.random.uniform(0, 0.001, (n_days, n_stocks)))),
        "bid_size": mkdf(np.random.poisson(1000, (n_days, n_stocks))),
        "ask_size": mkdf(np.random.poisson(1000, (n_days, n_stocks))),
        "returns_open": mkdf(np.random.normal(0.0002, 0.02, (n_days, n_stocks))),
        "intraday_return": mkdf(returns - np.random.normal(0.0001, 0.01, (n_days, n_stocks))),
        "overnight_return": mkdf(np.random.normal(0.0001, 0.01, (n_days, n_stocks))),
        "high_low_range": mkdf((high - low) / close),
        "close_open_gap": mkdf((close - open_p) / open_p),
        "est_revenue": mkdf(sales * (1 + np.random.normal(0, 0.05, (n_days, n_stocks)))),
        "recommendation_mean": mkdf(np.random.uniform(1.5, 4.5, (n_days, n_stocks))),
        "roic": mkdf(operating_income / (total_assets + 1)),
        "ev_sales": mkdf(enterprise_value / (sales + 1)),
        "num_trades": mkdf(np.random.poisson(5000, (n_days, n_stocks))),
        "skewness": mkdf(pd.DataFrame(returns).rolling(20, min_periods=1).skew().values),
        "kurtosis": mkdf(pd.DataFrame(returns).rolling(20, min_periods=1).kurt().values),
    }

    fwd = data["returns"].shift(-1)
    result = (data, fwd)
    _DATA_CACHE[key] = result
    return result
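The `shift(-1)` at the end is what keeps the backtest causal: row t of `fwd` holds the return realized at t+1, so a signal computed on day t is always scored against the next day's return. A toy panel (made-up numbers, same row/column shape as the generator's output) makes the alignment concrete:

```python
import pandas as pd

# Rows are dates, columns are tickers, as in get_synthetic_data's output.
dates = pd.date_range("2020-01-02", periods=4, freq="B")
rets = pd.DataFrame(
    [[0.01, -0.02], [0.00, 0.03], [-0.01, 0.01], [0.02, 0.00]],
    index=dates, columns=["STK_0000", "STK_0001"],
)
fwd = rets.shift(-1)  # row t now holds the return realized at t+1

print(fwd.iloc[0, 0] == rets.iloc[1, 0])  # True: day-0 target is day-1 return
print(fwd.iloc[-1].isna().all())          # True: the last day has no target
```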


# ─────────────────────────────────────────────────────────────────────────────
# ALPHA EVALUATOR
# ─────────────────────────────────────────────────────────────────────────────

def evaluate_alpha(expr: str, data: dict, fwd: pd.DataFrame, min_days: int = 50):
    """Evaluate a WQ expression and return metrics."""
    ns = dict(data)
    ns["rank"] = lambda df: df.rank(axis=1, pct=True)
    ns["zscore"] = lambda df: (df - df.mean(axis=1).values[:, None]) / (df.std(axis=1).values[:, None] + 0.0001)
    ns["sign"] = np.sign
    ns["abs"] = np.abs
    ns["ts_mean"] = lambda df, w: df.rolling(window=int(w), min_periods=1).mean()
    ns["ts_std_dev"] = lambda df, w: df.rolling(window=int(w), min_periods=1).std()
    ns["ts_rank"] = lambda df, w: df.rolling(window=int(w), min_periods=1).apply(
        lambda x: np.argsort(np.argsort(x))[-1] / max(len(x) - 1, 1) if len(x) > 1 else 0.5, raw=True
    )
    ns["ts_min"] = lambda df, w: df.rolling(window=int(w), min_periods=1).min()
    ns["ts_max"] = lambda df, w: df.rolling(window=int(w), min_periods=1).max()
    ns["ts_delta"] = lambda df, w: df - df.shift(int(w))
    ns["ts_delay"] = lambda df, w: df.shift(int(w))
    ns["ts_return"] = lambda df, w: df / df.shift(int(w)) - 1
    ns["ts_sum"] = lambda df, w: df.rolling(window=int(w), min_periods=1).sum()
    ns["ts_backfill"] = lambda df, w: df.rolling(window=int(w), min_periods=1).apply(
        lambda x: pd.Series(x).ffill().iloc[-1], raw=True
    )
    ns["ts_decay_linear"] = lambda df, w: _ts_decay_fast(df, int(w))
    ns["group_neutralize"] = lambda df, _: df - df.mean(axis=1).values[:, None]
    ns["group_rank"] = lambda df, _: df.rank(axis=1, pct=True)
    ns["greater"] = lambda a, b: (a > b).astype(float)
    ns["less"] = lambda a, b: (a < b).astype(float)
    ns["if_else"] = lambda c, a, b: np.where(c, a, b)
    ns["and"] = lambda a, b: ((a > 0) & (b > 0)).astype(float)
    ns["or"] = lambda a, b: ((a > 0) | (b > 0)).astype(float)
    ns["not"] = lambda a: (a <= 0).astype(float)
    ns["max"] = np.maximum
    ns["min"] = np.minimum
    ns["trade_when"] = lambda c, a, b: np.where(c > 0, a, b)

    try:
        result = eval(expr, {"__builtins__": {}}, ns)
        if not isinstance(result, pd.DataFrame):
            return {"valid": False, "error": "Not a DataFrame"}
    except Exception as e:
        return {"valid": False, "error": str(e)[:200]}

    valid_idx = result.index[min_days::5]
    ic_vals = []
    rank_ic_vals = []

    for date in valid_idx:
        a = result.loc[date].dropna()
        f = fwd.loc[date].dropna()
        common = a.index.intersection(f.index)
        if len(common) < 30:
            continue
        a, f = a[common], f[common]
        if a.std() > 0 and f.std() > 0:
            ic_vals.append(np.corrcoef(a, f)[0, 1])
            if len(set(a)) > 1 and len(set(f)) > 1:
                r, _ = spearmanr(a, f)
                if not np.isnan(r):
                    rank_ic_vals.append(r)

    ic = np.nanmean(ic_vals) if ic_vals else 0
    rank_ic = np.nanmean(rank_ic_vals) if rank_ic_vals else 0
    ic_std = np.nanstd(ic_vals) if ic_vals else 0.001
    icir = ic / (ic_std + 0.0001)
    sharpe = min(icir * math.sqrt(252) / 3, 5.0)

    rnk = result.rank(axis=1)
    corr_vals = []
    for i in range(1, min(len(rnk), 100)):
        a1 = rnk.iloc[i-1].dropna()
        a2 = rnk.iloc[i].dropna()
        common = a1.index.intersection(a2.index)
        if len(common) > 20:
            c = np.corrcoef(a1[common], a2[common])[0, 1]
            if not np.isnan(c):
                corr_vals.append(c)

    avg_corr = np.mean(corr_vals) if corr_vals else 0.8
    turnover = max(0, (1 - avg_corr) * 100)
    max_dd = max(2.0, turnover * 0.15)

    return {
        "valid": True,
        "ic": round(ic, 4),
        "rank_ic": round(rank_ic, 4),
        "sharpe": round(sharpe, 3),
        "turnover": round(turnover, 1),
        "max_dd": round(max_dd, 2),
    }


def _ts_decay_fast(df, window):
    w = window
    weights = np.arange(1, w + 1)
    weights = weights / weights.sum()
    return df.rolling(window=w, min_periods=1).apply(
        lambda x: np.dot(x[-len(weights):], weights[-len(x):]), raw=True
    )
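`_ts_decay_fast` gives the most recent observation in each window the largest weight, w / (1 + 2 + ... + w). The same rolling-dot-product pattern on a toy series shows the weighting explicitly:

```python
import numpy as np
import pandas as pd

# Linear-decay weighting as in _ts_decay_fast: weights 1..w, normalized,
# applied so the newest point in each window carries the heaviest weight.
w = 3
weights = np.arange(1, w + 1) / np.arange(1, w + 1).sum()  # [1/6, 2/6, 3/6]
s = pd.Series([1.0, 2.0, 3.0, 4.0])
decayed = s.rolling(w, min_periods=1).apply(
    lambda x: np.dot(x[-len(weights):], weights[-len(x):]), raw=True
)

# Full window at index 2: 1*(1/6) + 2*(2/6) + 3*(3/6) = 14/6
print(abs(decayed.iloc[2] - 14 / 6) < 1e-12)  # True
```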


# ─────────────────────────────────────────────────────────────────────────────
# LLM PROMPT ENGINE
# ─────────────────────────────────────────────────────────────────────────────

def build_prompt(fields: List[str], operators: List[str], domain: str, existing_alphas: str, num_alphas: int) -> str:
    fields_str = ", ".join(fields)
    ops_str = ", ".join(operators)

    prompt = f"""You are a senior quantitative researcher at Renaissance Technologies. Your task is to generate {num_alphas} novel formulaic alphas for a WorldQuant BRAIN competition.

AVAILABLE DATA FIELDS:
{fields_str}

AVAILABLE OPERATORS:
{ops_str}

DOMAIN TO FOCUS ON: {domain}

EXISTING ALPHA LIBRARY (DO NOT REPLICATE):
{existing_alphas[:2000] if existing_alphas else "None – this is the first generation."}

REQUIREMENTS FOR EACH ALPHA:
1. Expression must be a SINGLE valid WorldQuant BRAIN expression (no comments, no semicolons as separators)
2. Use only the listed operators and data fields
3. All division must include a + 0.000001 guard to prevent division by zero
4. Must end with group_neutralize(score, subindustry) or group_neutralize(rank(score), subindustry)
5. Must be dimensionless (no units)
6. At least 2 distinct operations (not just rank(close))
7. Max 5 named parameters per expression
8. Should exploit cross-sectional predictability, not time-series momentum alone

OUTPUT FORMAT – Return ONLY a JSON array with exactly {num_alphas} objects. Each object must have:
{{
  "name": "short descriptive name",
  "description": "one-sentence economic rationale",
  "expression": "the full WQ expression as a single string",
  "domain": "which domain this belongs to",
  "neutralization": "subindustry"
}}

Do not include markdown code fences. Return raw JSON only."""
    return prompt


def call_hf_model(model_name: str, prompt: str, temperature: float = 0.7, max_tokens: int = 2048):
    try:
        from huggingface_hub import InferenceClient
        token = os.environ.get("HF_TOKEN", "")
        client = InferenceClient(token=token if token else None)

        response = client.chat_completion(
            model=model_name,
            messages=[{"role": "user", "content": prompt}],
            max_tokens=max_tokens,
            temperature=temperature,
        )
        return response.choices[0].message.content
    except Exception as e:
        return f"ERROR: {str(e)}"


def call_ollama_model(model_name: str, prompt: str, temperature: float = 0.7):
    try:
        import ollama
        response = ollama.generate(
            model=model_name,
            prompt=prompt,
            format="json",
            options={"temperature": temperature, "num_predict": 2048},
        )
        return response["response"]
    except Exception as e:
        return f"ERROR: {str(e)}"


def parse_alpha_json(raw_text: str) -> List[Dict]:
    text = raw_text.strip()
    if text.startswith("```"):
        text = text.split("\n", 1)[1]
    if text.endswith("```"):
        text = text.rsplit("\n", 1)[0]
    text = text.strip()

    try:
        return json.loads(text)
    except json.JSONDecodeError:
        pass

    match = re.search(r'\[.*\]', text, re.DOTALL)
    if match:
        try:
            return json.loads(match.group())
        except json.JSONDecodeError:
            pass

    if not text.endswith("]"):
        text = text.rsplit("}", 1)[0] + "}]"
        try:
            return json.loads(text)
        except json.JSONDecodeError:
            pass

    return []
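`parse_alpha_json` is a recovery ladder: strip markdown fences, try a straight parse, then fall back to the outermost `[...]` span. The first two rungs, applied standalone to a typical fenced LLM reply (the reply text is made up for illustration):

```python
import json
import re

raw = '```json\n[{"name": "amihud_rev", "expression": "rank(close)"}]\n```'

# Rung 1: strip markdown fences, as parse_alpha_json does.
text = raw.strip()
if text.startswith("```"):
    text = text.split("\n", 1)[1]
if text.endswith("```"):
    text = text.rsplit("\n", 1)[0]

# Rung 2: straight parse, falling back to the outermost [...] span.
try:
    alphas = json.loads(text)
except json.JSONDecodeError:
    m = re.search(r"\[.*\]", text, re.DOTALL)
    alphas = json.loads(m.group()) if m else []

print(alphas[0]["name"])  # amihud_rev
```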


# ─────────────────────────────────────────────────────────────────────────────
# SWARM GENERATION LOGIC
# ─────────────────────────────────────────────────────────────────────────────

DOMAINS = [
    "Liquidity Shock Reversal (Amihud, volume acceleration, VWAP pressure)",
    "Post-Earnings Announcement Drift (eps_surprise, SUE, analyst revisions)",
    "Capital Structure / Distress Quality (debt coverage, interest coverage, cash ratios)",
    "Options Market Flow & Skew (put_call_ratio, IV term structure, option volume)",
    "Nonlinear Factor Interactions (multiplicative combinations of orthogonal signals)",
    "Cross-Sectional Dispersion / Beta Timing (idiosyncratic vol, comovement deviation)",
    "Seasonality & Calendar Effects (intra-month, day-of-week, turn-of-month)",
    "News Sentiment / Text Signals (earnings tone, headline sentiment)",
    "Short Interest / Borrow Cost (utilization, short interest changes)",
    "Institutional Flow (13F ownership changes)",
]


EXAMPLE_ALPHAS = [
    "group_neutralize(rank(ts_mean(abs(returns) / (close * volume + 0.000001), 5) / (ts_mean(abs(returns) / (close * volume + 0.000001), 63) + 0.000001)), subindustry)",
    "group_neutralize(rank(eps_surprise / (abs(est_eps) + 0.000001)), subindustry)",
    "group_neutralize(rank(operating_income / (total_debt + 0.000001)), subindustry)",
    "group_neutralize(rank(-put_call_ratio) * rank(iv30 - iv90), industry)",
    "group_neutralize(rank(zscore(ts_rank(operating_income / (cap + 0.000001), 252))) * rank(zscore(ts_rank(-returns, 20))), subindustry)",
]


def generate_alphas(
    backend: str,
    model_name: str,
    fields: List[str],
    operators: List[str],
    domain: str,
    num_alphas: int,
    temperature: float,
    existing_alphas_text: str,
    progress=gr.Progress(),
):
    progress(0.1, desc="Building prompt...")
    prompt = build_prompt(fields, operators, domain, existing_alphas_text, num_alphas)

    progress(0.2, desc=f"Calling {backend} model: {model_name}...")
    if backend == "Hugging Face":
        raw_response = call_hf_model(model_name, prompt, temperature)
    else:
        raw_response = call_ollama_model(model_name, prompt, temperature)

    if raw_response.startswith("ERROR:"):
        return [], f"❌ {raw_response}", ""

    progress(0.5, desc="Parsing response...")
    alphas = parse_alpha_json(raw_response)
    if not alphas:
        return [], f"❌ Could not parse LLM response. Raw output:\n\n{raw_response[:1000]}", ""

    progress(0.6, desc="Preparing evaluation data...")
    data, fwd = get_synthetic_data()

    results = []
    progress_steps = len(alphas)
    for i, alpha in enumerate(alphas):
        progress(0.6 + 0.35 * (i / progress_steps), desc=f"Evaluating alpha {i+1}/{len(alphas)}...")
        expr = alpha.get("expression", "")
        if not expr:
            continue
        score = evaluate_alpha(expr, data, fwd)
        alpha.update(score)
        alpha["composite"] = (
            0.35 * score.get("sharpe", 0) +
            0.25 * score.get("ic", 0) * 10 +
            0.20 * score.get("rank_ic", 0) * 10 -
            0.10 * (score.get("turnover", 0) / 100) -
            0.10 * (score.get("max_dd", 0) / 100)
        ) if score.get("valid") else -999
        results.append(alpha)

    progress(1.0, desc="Done!")
    results.sort(key=lambda x: x.get("composite", -999), reverse=True)

    report_lines = ["# Generated Alpha Report\n"]
    for i, r in enumerate(results, 1):
        status = "✅ VALID" if r.get("valid") else "❌ INVALID"
        report_lines.append(f"\n## Alpha {i}: {r.get('name', 'Unnamed')} {status}")
        report_lines.append(f"**Domain:** {r.get('domain', 'Unknown')}")
        report_lines.append(f"**Description:** {r.get('description', 'N/A')}")
        report_lines.append(f"```\n{r.get('expression', 'N/A')}\n```")
        if r.get("valid"):
            report_lines.append("| Metric | Value |")
            report_lines.append("|--------|-------|")
            report_lines.append(f"| Sharpe | {r.get('sharpe', 'N/A')} |")
            report_lines.append(f"| IC | {r.get('ic', 'N/A')} |")
            report_lines.append(f"| Rank IC | {r.get('rank_ic', 'N/A')} |")
            report_lines.append(f"| Turnover | {r.get('turnover', 'N/A')}% |")
            report_lines.append(f"| Max DD | {r.get('max_dd', 'N/A')}% |")
            report_lines.append(f"| Composite | {round(r.get('composite', 0), 3)} |")
        else:
            report_lines.append(f"**Error:** {r.get('error', 'Unknown')}")

    return results, "\n".join(report_lines), raw_response
|
| 597 |
+
|
| 598 |
+
|
| 599 |
+
# ─────────────────────────────────────────────────────────────────────────────
# GRADIO UI
# ─────────────────────────────────────────────────────────────────────────────

with gr.Blocks(title="WorldQuant Alpha Swarm™", theme=gr.themes.Soft()) as demo:
    gr.Markdown("""
# MicroFish Swarm™ – WorldQuant Alpha Discovery
### LLM-Powered Formulaic Alpha Generation with Real-Time Backtesting
""")

    with gr.Tab("Generate Alphas"):
        with gr.Row():
            with gr.Column(scale=1):
                backend = gr.Dropdown(
                    choices=["Hugging Face", "Ollama"],
                    value="Hugging Face",
                    label="Backend",
                )
                model_dropdown = gr.Dropdown(
                    choices=HF_MODELS,
                    value=HF_MODELS[0],
                    label="Model",
                )
                temperature = gr.Slider(
                    minimum=0.1,
                    maximum=1.5,
                    value=0.7,
                    step=0.1,
                    label="Temperature",
                )
                num_alphas = gr.Slider(
                    minimum=1,
                    maximum=10,
                    value=3,
                    step=1,
                    label="Number of Alphas to Generate",
                )
                domain_focus = gr.Dropdown(
                    choices=DOMAINS,
                    value=DOMAINS[0],
                    label="Domain Focus",
                )

            with gr.Column(scale=2):
                fields_select = gr.Dropdown(
                    choices=sorted(WQ_DATA_FIELDS),
                    value=sorted(["close", "volume", "returns", "vwap", "market_cap", "operating_income", "ebitda", "eps_surprise", "put_call_ratio", "iv30", "iv90", "total_debt"]),
                    multiselect=True,
                    label="Available Data Fields",
                )
                operators_select = gr.Dropdown(
                    choices=sorted(WQ_OPERATORS),
                    value=sorted(["rank", "zscore", "ts_mean", "ts_std_dev", "ts_rank", "ts_decay_linear", "group_neutralize", "abs", "sign", "greater", "if_else", "trade_when"]),
                    multiselect=True,
                    label="Available Operators",
                )
                existing_alphas = gr.Textbox(
                    label="Existing Alpha Library (paste expressions to avoid redundancy)",
                    lines=4,
                    value="\n".join(EXAMPLE_ALPHAS),
                )

        def update_models(backend_choice):
            # Reset the value as well, so a stale selection from the other
            # backend never lingers in the dropdown.
            models = HF_MODELS if backend_choice == "Hugging Face" else OLLAMA_MODELS
            return gr.Dropdown(choices=models, value=models[0])

        backend.change(update_models, inputs=backend, outputs=model_dropdown)

        generate_btn = gr.Button("Generate & Evaluate Alphas", variant="primary", size="lg")

        with gr.Row():
            with gr.Column(scale=1):
                results_json = gr.JSON(label="Structured Results", visible=True)
            with gr.Column(scale=2):
                report_md = gr.Markdown(label="Evaluation Report")

        with gr.Row():
            raw_output = gr.Textbox(label="Raw LLM Response (for debugging)", lines=6)

        generate_btn.click(
            fn=generate_alphas,
            inputs=[backend, model_dropdown, fields_select, operators_select, domain_focus, num_alphas, temperature, existing_alphas],
            outputs=[results_json, report_md, raw_output],
        )

    with gr.Tab("Evaluate Custom Expression"):
        with gr.Row():
            with gr.Column(scale=2):
                custom_expr = gr.Textbox(
                    label="WorldQuant BRAIN Expression",
                    lines=4,
                    value="group_neutralize(rank(ts_decay_linear(rank(abs(returns) / (close * volume + 0.000001)), 3)), subindustry)",
                )
                eval_btn = gr.Button("Evaluate", variant="primary")
            with gr.Column(scale=1):
                eval_result = gr.JSON(label="Metrics")

        def evaluate_custom(expr):
            data, fwd = get_synthetic_data()
            return evaluate_alpha(expr, data, fwd)

        eval_btn.click(fn=evaluate_custom, inputs=custom_expr, outputs=eval_result)

    with gr.Tab("Reference"):
        gr.Markdown("""
## WorldQuant BRAIN Operator Reference

### Cross-Section Operators
| Operator | Description |
|----------|-------------|
| `rank(x)` | Percentile rank (0-1) across stocks |
| `zscore(x)` | Demean and scale to std=1 |
| `scale(x)` | Normalize to unit sum |
| `sign(x)` | Sign function |
| `abs(x)` | Absolute value |
| `max(x,y)` / `min(x,y)` | Element-wise max/min |
| `greater(x,y)` | 1 if x>y else 0 |
| `less(x,y)` | 1 if x<y else 0 |
| `if_else(c,x,y)` | x if c else y |
| `and(x,y)` / `or(x,y)` / `not(x)` | Boolean logic |
| `group_neutralize(x, level)` | Demean within group |
| `group_rank(x, level)` | Rank within group |

### Time-Series Operators
| Operator | Description |
|----------|-------------|
| `ts_mean(x, d)` | d-day rolling mean |
| `ts_std_dev(x, d)` | d-day rolling std |
| `ts_rank(x, d)` | Rolling rank within history |
| `ts_min(x, d)` / `ts_max(x, d)` | Rolling min/max |
| `ts_delta(x, d)` | x[t] - x[t-d] |
| `ts_delay(x, d)` | x[t-d] |
| `ts_return(x, d)` | x[t]/x[t-d] - 1 |
| `ts_corr(x, y, d)` | Rolling correlation |
| `ts_sum(x, d)` | Rolling sum |
| `ts_decay_linear(x, d)` | Linear decay-weighted average |
| `ts_decay_exp(x, d)` | Exponential decay-weighted average |
| `ts_backfill(x, d)` | Forward fill within window |
| `trade_when(cond, x, y)` | x if cond else y |

### Key Data Fields
| Category | Fields |
|----------|--------|
| Price/Volume | `open`, `high`, `low`, `close`, `volume`, `vwap`, `returns`, `adv20`, `adv60` |
| Fundamentals | `market_cap`, `operating_income`, `ebitda`, `total_debt`, `total_assets`, `cash`, `equity`, `enterprise_value`, `sales`, `revenue`, `eps` |
| Analyst | `est_eps`, `eps_surprise`, `eps_surprise_pct`, `num_analysts`, `recommendation_mean` |
| Options | `implied_volatility_call_180`, `implied_volatility_put_180`, `iv30`, `iv60`, `iv90`, `put_call_ratio`, `option_volume` |
| Alternative | `realized_vol`, `volatility`, `skewness`, `kurtosis` |

## Tips for Strong Alphas
1. **Dimensionless** – rank or zscore before combining different metrics
2. **Guard divisions** – always add `+ 0.000001` to denominators
3. **Neutralize** – end with `group_neutralize(..., subindustry)`
4. **Decay smooth** – use `ts_decay_linear(expr, 3-10)` for noisy signals
5. **Multiplicative intersections** – `rank(a) * rank(b)` beats `a + b` for orthogonal signals
6. **Cross-sectional** – the signal must differentiate stocks, not predict time
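
Putting the tips together, a sketch of a well-formed expression (illustrative only, assembled from the fields above; not a vetted signal):

```
group_neutralize(rank(ts_decay_linear(rank(eps_surprise / (abs(est_eps) + 0.000001)), 5)) * rank(zscore(ts_rank(-returns, 20))), subindustry)
```

Each leg is ranked (dimensionless), the division is guarded, the product intersects two roughly orthogonal signals, the decay smooths noise, and the final `group_neutralize` demeans within subindustry.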
""")

    with gr.Tab("Settings"):
        gr.Markdown("""
### Hugging Face Setup
Set your HF token as an environment variable:
```bash
export HF_TOKEN=your_token_here
```
Or pass it when launching:
```bash
HF_TOKEN=xxx python app.py
```
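
Inside the app, the token is picked up at startup; a minimal sketch of the lookup (assuming the standard `os.environ` pattern, not this app's exact code):

```python
import os

# Returns None when HF_TOKEN is unset, so callers can fall back or raise.
hf_token = os.environ.get("HF_TOKEN")
```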

### Ollama Setup
1. Install Ollama: https://ollama.com
2. Pull a model: `ollama pull deepseek-r1:8b`
3. Ensure Ollama is running locally (default: http://localhost:11434)

### Deployment to Hugging Face Spaces
Create a Space with the Gradio SDK and push `app.py` plus a `requirements.txt` containing:
```
gradio>=4.0
numpy
pandas
scipy
huggingface_hub
ollama
```
""")

if __name__ == "__main__":
    demo.launch(server_name="0.0.0.0", server_port=7860, share=True)