Spaces:

groundlens
/

groundlens-api

Sleeping

App Files Files Community

AI-that-works committed 7 days ago

Commit

6d74c84

verified ·

1 Parent(s): 65d8577

Upload 4 files

Browse files

Files changed (4) hide show

Dockerfile +14 -0
README.md +129 -0
app.py +269 -0
requirements.txt +5 -0

Dockerfile ADDED Viewed

	@@ -0,0 +1,14 @@

+FROM python:3.11-slim
+# Hugging Face Docker Spaces run the container as UID 1000. Create that user
+# up front so pip installs and runtime cache writes (e.g. model downloads)
+# land in a writable home directory instead of failing on permissions.
+RUN useradd -m -u 1000 user
+USER user
+ENV HOME=/home/user \
+    PATH=/home/user/.local/bin:$PATH
+WORKDIR $HOME/app
+# Install dependencies first (layer caching)
+COPY --chown=user requirements.txt .
+RUN pip install --no-cache-dir -r requirements.txt
+COPY --chown=user . .
+# HF Spaces expects port 7860
+EXPOSE 7860
+CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]

README.md ADDED Viewed

	@@ -0,0 +1,129 @@

+---
+title: groundlens API
+emoji: 📐
+colorFrom: yellow
+colorTo: red
+sdk: docker
+pinned: false
+license: mit
+tags:
+- hallucination-detection
+- llm-evaluation
+- rag
+- grounding
+- groundlens
+- api
+short_description: REST API for geometric LLM hallucination detection
+---
+# groundlens API
+REST API for [groundlens](https://groundlens.dev) — LLM hallucination detection using embedding geometry.
+No second LLM. Deterministic. Same inputs → same scores.
+## Endpoints
+| Method | Path | Description |
+|--------|------|-------------|
+| `POST` | `/v1/check` | Auto-selects SGI or DGI based on context |
+| `POST` | `/v1/sgi` | Context-based grounding check |
+| `POST` | `/v1/dgi` | Context-free grounding check |
+| `GET` | `/health` | Liveness + model status |
+| `GET` | `/docs` | Interactive Swagger UI |
+## Quick start
+### Check without context (DGI)
+```bash
+curl -X POST https://groundlens-groundlens-api.hf.space/v1/check \
+  -H "Content-Type: application/json" \
+  -d '{
+    "question": "What is the capital of France?",
+    "response": "The capital of France is Paris."
+  }'
+```
+### Check with context (SGI)
+```bash
+curl -X POST https://groundlens-groundlens-api.hf.space/v1/check \
+  -H "Content-Type: application/json" \
+  -d '{
+    "question": "What does our policy cover?",
+    "response": "The policy covers fire, flood, and theft damage to residential properties.",
+    "context": "HomeShield Insurance Policy: Coverage includes damage from fire, flood, and theft for residential properties within the continental United States."
+  }'
+```
+### Python
+```python
+import requests
+r = requests.post(
+    "https://groundlens-groundlens-api.hf.space/v1/check",
+    json={
+        "question": "What is the capital of France?",
+        "response": "The capital of France is Paris.",
+    },
+)
+print(r.json()["verdict"])  # GROUNDED
+```
+### JavaScript
+```javascript
+const res = await fetch("https://groundlens-groundlens-api.hf.space/v1/check", {
+  method: "POST",
+  headers: { "Content-Type": "application/json" },
+  body: JSON.stringify({
+    question: "What is the capital of France?",
+    response: "The capital of France is Paris.",
+  }),
+});
+const data = await res.json();
+console.log(data.verdict); // GROUNDED
+```
+## Response format
+```json
+{
+  "verdict": "GROUNDED",
+  "flagged": false,
+  "method": "DGI (Directional Grounding Index)",
+  "score": 0.4521,
+  "threshold": 0.30,
+  "explanation": "The response follows patterns typical of grounded answers.",
+  "detail": {
+    "interpretation": "Positive directional alignment with grounded response patterns."
+  },
+  "latency_ms": 45
+}
+```
+## Self-hosting
+```bash
+git clone https://github.com/groundlens-dev/groundlens-api.git
+cd groundlens-api
+pip install -r requirements.txt
+uvicorn app:app --host 0.0.0.0 --port 8000
+```
+Or with Docker:
+```bash
+docker build -t groundlens-api .
+docker run -p 8000:7860 groundlens-api
+```
+## Links
+- [groundlens library](https://github.com/groundlens-dev/groundlens) — `pip install groundlens`
+- [MCP Server](https://github.com/groundlens-dev/groundlens-mcp) — for Claude Desktop, Cursor, Windsurf
+- [Demo](https://huggingface.co/spaces/groundlens/groundlens-demo) — interactive web UI
+- [Documentation](https://docs.groundlens.dev)
+- [Website](https://groundlens.dev)

app.py ADDED Viewed

	@@ -0,0 +1,269 @@

+"""
+groundlens REST API
+Lightweight HTTP wrapper around the groundlens library.
+Deploy on Hugging Face Spaces (Docker SDK), Railway, Fly.io, or any container host.
+Endpoints:
+  POST /v1/check   — auto-selects SGI or DGI based on whether context is provided
+  POST /v1/sgi     — explicit context-based grounding check
+  POST /v1/dgi     — explicit context-free grounding check
+  GET  /health     — liveness + model status
+"""
+from __future__ import annotations
+import time
+from contextlib import asynccontextmanager
+from typing import Optional
+from fastapi import FastAPI, HTTPException
+from fastapi.middleware.cors import CORSMiddleware
+from pydantic import BaseModel, Field, ConfigDict
+# ─────────────────────────────────────────────────────────────────────────────
+# Model preloading
+# ─────────────────────────────────────────────────────────────────────────────
+# Flipped to True by _load_model() after the warm-up call returns; the
+# endpoints answer 503 and /health reports "loading" while it is False.
+_model_ready: bool = False
+# Wall-clock seconds the warm-up took, rounded to 2 decimals; stays 0.0 until
+# _load_model() has completed.
+_model_load_time: float = 0.0
+def _load_model() -> None:
+    """Import groundlens to trigger model download + warm the embedding cache."""
+    global _model_ready, _model_load_time
+    if _model_ready:
+        return
+    t0 = time.monotonic()
+    from groundlens import compute_dgi  # noqa: F401
+    # Warm up — first call loads the sentence-transformer model
+    compute_dgi(question="warmup", response="warmup")
+    _model_load_time = round(time.monotonic() - t0, 2)
+    _model_ready = True
+@asynccontextmanager
+async def lifespan(app: FastAPI):
+    """Load model at startup so first request is fast.
+    Registered through ``FastAPI(lifespan=...)``. The code before ``yield`` is
+    the startup phase; nothing follows the ``yield``, so there is no
+    shutdown work.
+    """
+    # Synchronous call: startup does not finish until the warm-up returns.
+    _load_model()
+    yield
+# ─────────────────────────────────────────────────────────────────────────────
+# App
+# ─────────────────────────────────────────────────────────────────────────────
+app = FastAPI(
+    title="groundlens API",
+    description=(
+        "LLM hallucination detection using embedding geometry. "
+        "No second LLM. Deterministic. Same inputs → same scores."
+    ),
+    version="2026.5.12",
+    docs_url="/docs",
+    redoc_url="/redoc",
+    lifespan=lifespan,
+)
+app.add_middleware(
+    CORSMiddleware,
+    allow_origins=["*"],
+    allow_credentials=False,
+    allow_methods=["GET", "POST", "OPTIONS"],
+    allow_headers=["*"],
+)
+# ─────────────────────────────────────────────────────────────────────────────
+# Request / Response models
+# ─────────────────────────────────────────────────────────────────────────────
+class CheckRequest(BaseModel):
+    """Auto-select SGI or DGI based on whether context is provided."""
+    model_config = ConfigDict(str_strip_whitespace=True)
+    question: str = Field(
+        ...,
+        description="The question asked to the LLM",
+        min_length=1,
+        max_length=10_000,
+    )
+    response: str = Field(
+        ...,
+        description="The LLM's response to evaluate",
+        min_length=1,
+        max_length=50_000,
+    )
+    context: Optional[str] = Field(
+        default=None,
+        description=(
+            "Source material (document, RAG chunks, reference text). "
+            "If provided → SGI. If omitted → DGI."
+        ),
+        max_length=100_000,
+    )
+class SGIRequest(BaseModel):
+    """Explicit context-based grounding check."""
+    model_config = ConfigDict(str_strip_whitespace=True)
+    question: str = Field(..., min_length=1, max_length=10_000)
+    context: str = Field(..., min_length=1, max_length=100_000)
+    response: str = Field(..., min_length=1, max_length=50_000)
+class DGIRequest(BaseModel):
+    """Explicit context-free grounding check."""
+    model_config = ConfigDict(str_strip_whitespace=True)
+    question: str = Field(..., min_length=1, max_length=10_000)
+    response: str = Field(..., min_length=1, max_length=50_000)
+# Method-specific detail attached to SGI results. _run_sgi fills q_dist and
+# ctx_dist from the library result, rounded to 4 decimals.
+class SGIDetail(BaseModel):
+    # NOTE(review): presumably a distance relative to the question — confirm
+    # against the groundlens documentation.
+    q_dist: float
+    # NOTE(review): presumably a distance relative to the context — confirm
+    # against the groundlens documentation.
+    ctx_dist: float
+    # Explanation text copied from the library result's `explanation`.
+    interpretation: str
+# Method-specific detail attached to DGI results.
+class DGIDetail(BaseModel):
+    # Explanation text copied from the library result's `explanation`.
+    interpretation: str
+# Response body shared by /v1/check, /v1/sgi and /v1/dgi.
+class GroundingResult(BaseModel):
+    verdict: str = Field(description="GROUNDED or HALLUCINATION RISK")
+    flagged: bool = Field(description="True if hallucination risk detected")
+    # The helpers emit the long form, e.g. "SGI (Semantic Grounding Index)",
+    # not just the bare acronym.
+    method: str = Field(description="SGI or DGI")
+    # Rounded to 4 decimals by the helpers.
+    score: float = Field(description="Grounding score")
+    # Constant set by the helpers: 0.95 for SGI, 0.30 for DGI.
+    threshold: float = Field(description="Score threshold for flagging")
+    explanation: str = Field(description="Plain-language explanation")
+    # SGIDetail for SGI results, DGIDetail for DGI results.
+    detail: SGIDetail | DGIDetail
+    # Covers only the groundlens scoring call, not request parsing.
+    latency_ms: int = Field(description="Processing time in milliseconds")
+# Response body of GET /health.
+class HealthResponse(BaseModel):
+    # "ok" once the model warm-up has finished, otherwise "loading".
+    status: str
+    # Mirrors the module-level _model_ready flag.
+    model_loaded: bool
+    # Mirrors _model_load_time: warm-up duration in seconds (0.0 before load).
+    model_load_time_s: float
+    # API version string.
+    version: str
+# ─────────────────────────────────────────────────────────────────────────────
+# Helpers
+# ─────────────────────────────────────────────────────────────────────────────
+def _run_sgi(question: str, context: str, response: str) -> GroundingResult:
+    from groundlens import compute_sgi
+    t0 = time.monotonic()
+    result = compute_sgi(question=question, context=context, response=response)
+    latency = int((time.monotonic() - t0) * 1000)
+    return GroundingResult(
+        verdict="GROUNDED" if not result.flagged else "HALLUCINATION RISK",
+        flagged=result.flagged,
+        method="SGI (Semantic Grounding Index)",
+        score=round(result.value, 4),
+        threshold=0.95,
+        explanation=(
+            "The response appears grounded in the source material."
+            if not result.flagged
+            else "The response may not be based on the source material provided."
+        ),
+        detail=SGIDetail(
+            q_dist=round(result.q_dist, 4),
+            ctx_dist=round(result.ctx_dist, 4),
+            interpretation=result.explanation,
+        ),
+        latency_ms=latency,
+    )
+def _run_dgi(question: str, response: str) -> GroundingResult:
+    from groundlens import compute_dgi
+    t0 = time.monotonic()
+    result = compute_dgi(question=question, response=response)
+    latency = int((time.monotonic() - t0) * 1000)
+    return GroundingResult(
+        verdict="GROUNDED" if not result.flagged else "HALLUCINATION RISK",
+        flagged=result.flagged,
+        method="DGI (Directional Grounding Index)",
+        score=round(result.value, 4),
+        threshold=0.30,
+        explanation=(
+            "The response follows patterns typical of grounded answers."
+            if not result.flagged
+            else "The response shows geometric patterns associated with hallucination."
+        ),
+        detail=DGIDetail(
+            interpretation=result.explanation,
+        ),
+        latency_ms=latency,
+    )
+# ─────────────────────────────────────────────────────────────────────────────
+# Endpoints
+# ─────────────────────────────────────────────────────────────────────────────
+@app.get("/health", response_model=HealthResponse, tags=["system"])
+async def health():
+    """Liveness check. Returns model load status."""
+    return HealthResponse(
+        status="ok" if _model_ready else "loading",
+        model_loaded=_model_ready,
+        model_load_time_s=_model_load_time,
+        version="2026.5.12",
+    )
+@app.post("/v1/check", response_model=GroundingResult, tags=["grounding"])
+async def check(req: CheckRequest):
+    """Check whether an LLM response is hallucinated.
+    Auto-selects the right method:
+    - Context provided → SGI (checks if the response used the source material)
+    - No context → DGI (checks geometric grounding patterns)
+    """
+    if not _model_ready:
+        raise HTTPException(503, "Model is still loading. Try again in a few seconds.")
+    has_context = req.context is not None and req.context.strip() != ""
+    if has_context:
+        return _run_sgi(req.question, req.context, req.response)
+    else:
+        return _run_dgi(req.question, req.response)
+@app.post("/v1/sgi", response_model=GroundingResult, tags=["grounding"])
+async def sgi(req: SGIRequest):
+    """SGI — check if the response is grounded in a source document.
+    Use for RAG pipelines, document Q&A, or any case where you have
+    the source material the LLM was given.
+    """
+    if not _model_ready:
+        raise HTTPException(503, "Model is still loading. Try again in a few seconds.")
+    return _run_sgi(req.question, req.context, req.response)
+@app.post("/v1/dgi", response_model=GroundingResult, tags=["grounding"])
+async def dgi(req: DGIRequest):
+    """DGI — check grounding patterns without source context.
+    Use for open-ended chat, general Q&A, or any case where you just
+    have a question and the LLM's answer.
+    """
+    if not _model_ready:
+        raise HTTPException(503, "Model is still loading. Try again in a few seconds.")
+    return _run_dgi(req.question, req.response)

requirements.txt ADDED Viewed

	@@ -0,0 +1,5 @@

+groundlens>=2026.4.0
+fastapi>=0.115.0
+# app.py imports ConfigDict, which only exists in pydantic v2; pin it explicitly
+# rather than relying on whatever version fastapi's dependency range resolves to.
+pydantic>=2.0,<3.0
+uvicorn[standard]>=0.30.0
+transformers>=4.40.0,<5.0.0
+torch>=2.0.0