Switch embeddings to Gemini

- backend/config.py +12 -7
- backend/dependencies.py +0 -3
- backend/routers/agent.py +6 -1
- backend/routers/ingestion.py +6 -5
- backend/services/agent.py +81 -49
- ingestion/embedder.py +125 -32
- ui/package.json +3 -0
backend/config.py
CHANGED
@@ -32,21 +32,26 @@ class Settings:
     github_token: str = os.getenv("GITHUB_TOKEN", "")

     # ── Embeddings ──────────────────────────────────────────────────────────
+    # Three embedding providers, selected at startup by EMBEDDING_MODEL:
     #
+    # 1. Gemini (default – EMBEDDING_MODEL contains "gemini", needs GEMINI_API_KEY)
+    #    gemini-embedding-001: 768-dim output via MRL, generous free tier.
+    #    Re-uses the same GEMINI_API_KEY used for the LLM – no extra signup.
+    #    Free at https://aistudio.google.com.
+    #
+    # 2. Voyage AI (EMBEDDING_MODEL contains "voyage", needs VOYAGE_API_KEY)
     #    voyage-code-3: code-optimised, 1024-dim, 200M tokens/month free.
     #    ⚠️ Requires EMBEDDING_DIM=1024 and a NEW Qdrant collection – dims
-    #    are incompatible with
+    #    are incompatible with 768-dim collections.
     #
-    #    nomic-embed-text-v1.5:
+    # 3. Nomic (legacy fallback – NOMIC_API_KEY set)
+    #    nomic-embed-text-v1.5: 768-dim. Free quota is 10M tokens TOTAL
+    #    (not per month) – easy to exhaust across a few large indexes.
     #
     # EMBEDDING_DIM must match the chosen model exactly.
     nomic_api_key: str = os.getenv("NOMIC_API_KEY", "")
     voyage_api_key: str = os.getenv("VOYAGE_API_KEY", "")
-    embedding_model: str = os.getenv("EMBEDDING_MODEL", "
+    embedding_model: str = os.getenv("EMBEDDING_MODEL", "gemini-embedding-001")
     embedding_dim: int = int(os.getenv("EMBEDDING_DIM", "768"))

     # ── Chunking ──────────────────────────────────────────────────────────────
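
The comment block above pins each model to a vector size. A quick standalone check of
those pairings, useful before (re)creating a Qdrant collection, could look like this
(a minimal sketch, not part of the diff; it only restates the pairings documented above):

    import os

    # Pairings stated in the config comment: EMBEDDING_DIM must match the model exactly.
    EXPECTED_DIM = {
        "gemini-embedding-001": 768,    # default (GEMINI_API_KEY)
        "voyage-code-3": 1024,          # VOYAGE_API_KEY, needs a new Qdrant collection
        "nomic-embed-text-v1.5": 768,   # legacy fallback (NOMIC_API_KEY)
    }

    model = os.getenv("EMBEDDING_MODEL", "gemini-embedding-001")
    dim = int(os.getenv("EMBEDDING_DIM", "768"))
    if model in EXPECTED_DIM and EXPECTED_DIM[model] != dim:
        raise SystemExit(f"EMBEDDING_DIM={dim} does not match {model} (expected {EXPECTED_DIM[model]}).")
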
backend/dependencies.py
CHANGED
@@ -113,9 +113,6 @@ def check_rate_limit(request: Request) -> None:
     window = _rate_windows[ip]
     while window and window[0] < now - 60:
         window.popleft()
-    if not window:
-        del _rate_windows[ip]
-        return

     if len(window) >= limit:
         raise HTTPException(
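
The removed early return used to delete an IP's entry as soon as its window emptied and
skip the limit check; now every request falls through to the same check. A condensed,
standalone sketch of the sliding-window pattern this dependency uses (the function name,
limit value, and the final append are assumptions for illustration, not shown in the hunk):

    import time
    from collections import defaultdict, deque

    _rate_windows: dict[str, deque] = defaultdict(deque)

    def allow(ip: str, limit: int = 60) -> bool:
        now = time.time()
        window = _rate_windows[ip]
        # Evict timestamps older than the 60-second window.
        while window and window[0] < now - 60:
            window.popleft()
        if len(window) >= limit:
            return False          # over the per-minute limit
        window.append(now)        # assumed: the real dependency records the request after the check
        return True
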
backend/routers/agent.py
CHANGED
@@ -52,7 +52,12 @@ async def agent_query(
 ):
     """Run the agentic RAG loop synchronously via MCP tools."""
     try:
-        result = await agent_svc.run(
+        result = await agent_svc.run(
+            request.question,
+            repo_filter=request.repo,
+            history=request.history,
+            model_id=request.model_id,
+        )
         return AgentResponse(
             answer=result["answer"],
             tool_calls=[AgentToolCall(**tc) for tc in result["tool_calls"]],
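
The four arguments now forwarded to agent_svc.run() mirror the request model fields
(question, repo, history, model_id) and line up with the new run() signature in
backend/services/agent.py below. A hedged example request against this endpoint
(the URL path and port are assumptions; only the field names come from the diff):

    import httpx

    resp = httpx.post(
        "http://localhost:8000/agent",        # path assumed, not shown in the diff
        json={
            "question": "Where is rate limiting enforced?",
            "repo": None,                      # optional repo filter
            "history": [],                     # prior chat turns
            "model_id": None,                  # None falls back to the server's provider chain
        },
        timeout=120,
    )
    print(resp.json()["answer"])
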
backend/routers/ingestion.py
CHANGED
@@ -92,15 +92,16 @@ async def ingest_stream(repo: str, request: Request, force: bool = False):

     async def _run():
         try:
-            await asyncio.to_thread(services.ingestion.ingest, repo, force, _progress)
+            result = await asyncio.to_thread(services.ingestion.ingest, repo, force, _progress)
+            repo_slug = result.get("repo", repo)
             if services.diagram:
-                services.diagram.invalidate(
+                services.diagram.invalidate(repo_slug)
             if services.repo_map:
-                services.repo_map.invalidate(
+                services.repo_map.invalidate(repo_slug)
             now = datetime.now(timezone.utc).isoformat()
-            repo_indexed_at[
+            repo_indexed_at[repo_slug] = now
             if force:
-                repo_contextual_at[
+                repo_contextual_at[repo_slug] = now
         except Exception as e:
             loop.call_soon_threadsafe(queue.put_nowait, {"step": "error", "detail": str(e)})
         finally:
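
Capturing the ingest result lets the router key cache invalidation and timestamps on the
canonical repo slug returned by the pipeline rather than the raw path parameter. The
surrounding endpoint also shows a useful pattern: the blocking ingest runs in a worker
thread while progress events are pushed back to the event loop thread-safely. A condensed,
runnable sketch of that pattern (step names and the fake ingest body are placeholders):

    import asyncio

    async def main():
        loop = asyncio.get_running_loop()
        queue: asyncio.Queue = asyncio.Queue()

        def _progress(step: str) -> None:
            # Called from the worker thread: hand events to the loop thread safely.
            loop.call_soon_threadsafe(queue.put_nowait, {"step": step})

        def ingest() -> dict:
            _progress("cloning")                  # placeholder steps
            _progress("embedding")
            return {"repo": "owner/repo"}         # canonical slug, as used by the router

        async def _run():
            result = await asyncio.to_thread(ingest)
            queue.put_nowait({"step": "done", "repo": result.get("repo")})

        task = asyncio.create_task(_run())
        while True:
            event = await queue.get()
            print(event)
            if event.get("step") == "done":
                break
        await task

    asyncio.run(main())
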
backend/services/agent.py
CHANGED
@@ -516,6 +516,10 @@ class AgentService:
         """
         self.mcp = mcp_client
         self._repo_map = repo_map_svc
+        # Provider fallback and per-request model selection mutate the active
+        # client/provider/model fields. Serialise runs so concurrent requests
+        # cannot leak one user's selected model into another user's session.
+        self._run_lock = asyncio.Lock()

         # ── Provider detection ─────────────────────────────────────────────────
         # Priority: Cerebras (Qwen3-235B) → Gemini → OpenRouter → Anthropic → Groq.
@@ -566,65 +570,82 @@ class AgentService:

     # ── Public API ───────────────────────────────────────────────────────────

-    async def run(
+    async def run(
+        self,
+        question: str,
+        repo_filter: str | None = None,
+        history: list[dict] | None = None,
+        model_id: str | None = None,
+    ) -> dict:
         """
         Run the full ReAct loop and return the final answer + trace.

         Returns:
             {"answer": str, "tool_calls": list[dict], "iterations": int}
         """
+        async with self._run_lock:
+            _orig = (self._client, self._provider, self._model)
+            entry = next((m for m in AGENT_MODELS if m["id"] == model_id), None)
+            if entry:
+                self._client = _make_client(entry)
+                self._provider = entry["provider"]
+                self._model = entry["model"]
+
+            try:
+                # Discover tools from MCP server
+                mcp_tools = await self.mcp.list_tools()
+                messages = self._build_initial_messages(question, repo_filter, history)
+                tool_trace = []
+
+                # Loop detection: track (tool, args) pairs already executed this run.
+                # Prevents wasting all MAX_ITERATIONS on duplicate searches when the
+                # model gets confused and repeats the same call over and over.
+                seen_calls: set[tuple] = set()
+
+                for iteration in range(self.MAX_ITERATIONS):
+                    # LLM call is synchronous – run in thread pool to avoid blocking
+                    # Pass raw mcp_tools so _call_llm can reformat if provider switches mid-run
+                    step = await asyncio.to_thread(self._call_llm, messages, mcp_tools)
+
+                    if step["done"]:
+                        return {
+                            "answer": step["answer"],
+                            "tool_calls": tool_trace,
+                            "iterations": iteration + 1,
+                        }
+
+                    messages.append(step["assistant_message"])
+
+                    for tc in step["tool_calls"]:
+                        # Deduplicate: skip calls already made with identical arguments.
+                        call_key = (tc["name"], tuple(sorted(tc["input"].items())))
+                        if call_key in seen_calls:
+                            result = f"[Skipped duplicate {tc['name']} call – already ran with these arguments]"
+                            tool_trace.append({"tool": tc["name"], "input": tc["input"], "output": result})
+                            messages.append(self._build_tool_result(tc["id"], tc["name"], result))
+                            continue
+                        seen_calls.add(call_key)
+
+                        # Tool execution via MCP protocol (async HTTP)
+                        try:
+                            result = await self.mcp.call_tool(tc["name"], tc["input"])
+                        except Exception as e:
+                            result = f"Tool error: {e}"
+
+                        tool_trace.append({
+                            "tool": tc["name"],
+                            "input": tc["input"],
+                            "output": result[:500] + "..." if len(result) > 500 else result,
+                        })
+                        messages.append(self._build_tool_result(tc["id"], tc["name"], result))
+
+                return {
+                    "answer": "I was unable to fully answer within the allowed reasoning steps.",
+                    "tool_calls": tool_trace,
+                    "iterations": self.MAX_ITERATIONS,
+                }
+            finally:
+                self._client, self._provider, self._model = _orig

     async def stream(
         self,
@@ -655,6 +676,17 @@ class AgentService:
         we re-run with stream=True so tokens arrive in real time.
         This is one extra LLM call but delivers genuine streaming UX.
         """
+        async with self._run_lock:
+            async for event in self._stream_locked(question, repo_filter, history, model_id):
+                yield event
+
+    async def _stream_locked(
+        self,
+        question: str,
+        repo_filter: str | None = None,
+        history: list[dict] | None = None,
+        model_id: str | None = None,
+    ) -> AsyncIterator[dict]:
         # ── Per-request model override ─────────────────────────────────────────
         # If the user selected a specific model in the UI, temporarily swap to it.
         # We save/restore self._client/provider/model in a finally block so the
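
Two details of the new run() are worth spelling out. The lock plus the _orig save/restore
means a per-request model override can never leak into a concurrent request, and the
loop-detection key treats a tool call as (name, sorted argument items), so the same call
with the same arguments in a different order still counts as a duplicate. A tiny
standalone illustration of that key (tool name and arguments are made up):

    seen_calls: set[tuple] = set()

    def call_key(name: str, args: dict) -> tuple:
        # Sorting the items makes the key order-insensitive; values must be
        # hashable for this to work (true for flat string/number arguments).
        return (name, tuple(sorted(args.items())))

    first = call_key("search_code", {"query": "rate limit", "repo": "owner/repo"})
    repeat = call_key("search_code", {"repo": "owner/repo", "query": "rate limit"})

    seen_calls.add(first)
    assert repeat in seen_calls    # duplicate detected, so the agent skips the re-run
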
ingestion/embedder.py
CHANGED
@@ -1,38 +1,45 @@
 """
-embedder.py – Embed code chunks via
+embedder.py – Embed code chunks via a hosted embedding API.

 WHY API-BASED EMBEDDINGS
 ─────────────────────────
+Local sentence-transformers models are ~600MB RAM – enough to kill
+free-tier hosting (HF Spaces, Render: 512MB–1GB RAM limit). Hosted
+APIs give us zero RAM cost and equivalent quality, at the price of
+~200ms of network latency per batch.

+THREE PROVIDERS, ONE INTERFACE
 ──────────────────────────────
-Provider
+Provider is selected from EMBEDDING_MODEL at init:

+EMBEDDING_MODEL contains "voyage" + VOYAGE_API_KEY set
   → Voyage AI: code-optimised, 1024-dim, 200M tokens/month free.
     voyage-code-3 is specifically trained on code and outperforms
     general-purpose embedders on code retrieval benchmarks.
-    ⚠️ Requires
+    ⚠️ Requires EMBEDDING_DIM=1024 and a new Qdrant collection.

+EMBEDDING_MODEL contains "gemini" + GEMINI_API_KEY set (default)
+  → Google Gemini: gemini-embedding-001, 768-dim output (configurable
+    via MRL), generous free tier. Re-uses the same GEMINI_API_KEY we
+    use for the LLM – no separate signup.
+
+NOMIC_API_KEY set (legacy fallback)
+  → Nomic API: nomic-embed-text-v1.5, 768-dim. Free quota is 10M
+    tokens total – easy to exhaust across a few large repo indexes.

 TASK TYPES
 ──────────
+Every provider distinguishes document and query roles. A document
+projection and a query projection live in the same embedding space
+but are optimised for their direction of the inner product:
+  - document: used when indexing chunks
+  - query: used when embedding the user's question

 BATCHING
 ────────
+All three APIs accept batched input. We use groups of 32 to stay
+well under request-body size limits on large contextually-enriched
+chunks (~8KB each) and to keep individual retries cheap.
 """

 import time
@@ -45,11 +52,12 @@ sys.path.insert(0, str(Path(__file__).parent.parent))
 from backend.config import settings


-_NOMIC_API_URL
+_NOMIC_API_URL = "https://api-atlas.nomic.ai/v1/embedding/text"
+_GEMINI_API_BASE = "https://generativelanguage.googleapis.com/v1beta/models"
+_BATCH_SIZE = 32   # conservative for all providers: stays under ~10MB body
+                   # and keeps each failed batch cheap to retry
+_MAX_CHARS = 8000  # truncate each text before sending – embeddings degrade
+                   # gracefully on truncation and models silently clip anyway


 class Embedder:
@@ -69,13 +77,25 @@ class Embedder:
         self.model_name = model_name or settings.embedding_model
         self.embedding_dim = settings.embedding_dim

+        # Provider selection is driven by the MODEL NAME, with the available
+        # API key gating the choice. This lets an operator flip providers by
+        # only changing EMBEDDING_MODEL in .env – no code change needed.
+        name = self.model_name.lower()
+        if "voyage" in name and settings.voyage_api_key:
             self._provider = "voyage"
             self._init_voyage()
+        elif "gemini" in name and settings.gemini_api_key:
+            self._provider = "gemini"
+            self._init_gemini()
+        elif settings.nomic_api_key:
             self._provider = "nomic"
             self._init_nomic()
+        else:
+            raise RuntimeError(
+                f"No embedding provider available for model '{self.model_name}'. "
+                "Set GEMINI_API_KEY (default – free at https://aistudio.google.com), "
+                "or VOYAGE_API_KEY + EMBEDDING_MODEL=voyage-code-3."
+            )

     def _init_voyage(self):
         """Initialise Voyage AI client. voyage-code-3 is code-optimised 1024-dim."""
@@ -93,18 +113,23 @@ class Embedder:

     def _init_nomic(self):
         """Initialise Nomic API client. nomic-embed-text-v1.5 is 768-dim."""
-        if not settings.nomic_api_key:
-            raise RuntimeError(
-                "No embedding provider configured. "
-                "Set NOMIC_API_KEY (free at https://atlas.nomic.ai) or "
-                "VOYAGE_API_KEY + EMBEDDING_MODEL=voyage-code-3."
-            )
         self._nomic_key = settings.nomic_api_key
         print(
             f"Embedder: using Nomic API ({self.model_name}, {self.embedding_dim}-dim). "
             "No local model loaded."
         )

+    def _init_gemini(self):
+        """Initialise Gemini embeddings. gemini-embedding-001 supports MRL,
+        so we request exactly `embedding_dim` dimensions from the API – that
+        way one deployment can reuse an existing Qdrant collection schema
+        (768-dim) or scale up to a larger one without code changes."""
+        self._gemini_key = settings.gemini_api_key
+        print(
+            f"Embedder: using Gemini API ({self.model_name}, {self.embedding_dim}-dim). "
+            "No local model loaded."
+        )
+
     # ── Public interface ───────────────────────────────────────────────────────

     def embed_chunks(self, chunks: list[dict]) -> list[list[float]]:
@@ -123,6 +148,8 @@ class Embedder:
         texts = [c["text"][:_MAX_CHARS] for c in chunks]
         if self._provider == "voyage":
             return self._voyage_embed(texts, input_type="document")
+        if self._provider == "gemini":
+            return self._gemini_embed(texts, task_type="RETRIEVAL_DOCUMENT")
         return self._nomic_embed(texts, task_type="search_document")

     def embed_query(self, query: str) -> list[float]:
@@ -134,6 +161,8 @@ class Embedder:
         """
         if self._provider == "voyage":
             return self._voyage_embed([query], input_type="query")[0]
+        if self._provider == "gemini":
+            return self._gemini_embed([query], task_type="RETRIEVAL_QUERY")[0]
         return self._nomic_embed([query], task_type="search_query")[0]

     # ── Voyage AI implementation ───────────────────────────────────────────────
@@ -231,3 +260,67 @@ class Embedder:
             return response.json()["embeddings"]

         raise RuntimeError("Nomic API call failed after retries")
+
+    # ── Gemini API implementation ──────────────────────────────────────────────
+
+    def _gemini_embed(self, texts: list[str], task_type: str) -> list[list[float]]:
+        """Call Gemini batchEmbedContents with batching. Returns list of
+        `embedding_dim`-dim vectors.
+
+        task_type is the Gemini task enum (RETRIEVAL_DOCUMENT / RETRIEVAL_QUERY).
+        These produce different projections within the same embedding space –
+        the document projection is optimised for being retrieved, the query
+        projection for doing the retrieving.
+        """
+        all_embeddings: list[list[float]] = []
+        for i in range(0, len(texts), _BATCH_SIZE):
+            batch = [t[:_MAX_CHARS] for t in texts[i : i + _BATCH_SIZE]]
+            embeddings = self._gemini_call_api(batch, task_type)
+            all_embeddings.extend(embeddings)
+        return all_embeddings
+
+    def _gemini_call_api(
+        self,
+        texts: list[str],
+        task_type: str,
+        retries: int = 3,
+    ) -> list[list[float]]:
+        """
+        Single Gemini batchEmbedContents call with retry on rate limit (429)
+        or service error (503). Gemini free tier is RPM-capped, so backoff is
+        more aggressive than Nomic (3 retries vs 2, longer default wait).
+
+        Response shape:
+            { "embeddings": [{ "values": [float, ...] }, ...] }
+        """
+        url = (
+            f"{_GEMINI_API_BASE}/{self.model_name}:batchEmbedContents"
+            f"?key={self._gemini_key}"
+        )
+        model_id = f"models/{self.model_name}"
+        payload = {
+            "requests": [
+                {
+                    "model": model_id,
+                    "content": {"parts": [{"text": t}]},
+                    "taskType": task_type,
+                    "outputDimensionality": self.embedding_dim,
+                }
+                for t in texts
+            ]
+        }
+
+        for attempt in range(retries + 1):
+            response = http.post(url, json=payload, timeout=60)
+
+            if response.status_code in (429, 503) and attempt < retries:
+                # Gemini doesn't always send Retry-After; back off exponentially.
+                wait = int(response.headers.get("Retry-After", 2 ** attempt * 5))
+                print(f"Gemini API {response.status_code}. Waiting {wait}s before retry...")
+                time.sleep(wait)
+                continue
+
+            response.raise_for_status()
+            return [e["values"] for e in response.json()["embeddings"]]
+
+        raise RuntimeError("Gemini API call failed after retries")
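
With the Gemini branch in place, indexing and querying still go through the same two
public methods. A hedged usage sketch (assumes GEMINI_API_KEY is set and the defaults
from backend/config.py, i.e. gemini-embedding-001 at 768 dimensions; the exact
constructor arguments are not shown in the diff):

    from ingestion.embedder import Embedder

    embedder = Embedder()   # picks the Gemini branch from EMBEDDING_MODEL + GEMINI_API_KEY

    doc_vectors = embedder.embed_chunks([{"text": "def check_rate_limit(request): ..."}])
    query_vector = embedder.embed_query("where is rate limiting enforced?")

    # Both sides must match the Qdrant collection dimension (768 by default).
    assert len(doc_vectors[0]) == len(query_vector) == 768
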
ui/package.json
CHANGED
@@ -3,6 +3,9 @@
   "private": true,
   "version": "0.0.0",
   "type": "module",
+  "engines": {
+    "node": ">=20"
+  },
   "scripts": {
     "dev": "vite",
     "build": "vite build",