Spaces:

sh4shv4t
/

Parlay

Paused

App Files Community

sh4shv4t committed on Apr 22

Commit

dd46a0d

1 Parent(s): f5f4abf

refactor(agent): migrate Gemini client from google-generativeai to google-genai

Browse files

Files changed (4) hide show

.cursorrules +2 -2
agent/gemini_client.py +64 -29
requirements.txt +1 -1
training/notebooks/parlay_training.ipynb +1 -1

.cursorrules CHANGED Viewed

@@ -12,8 +12,8 @@ NO Anthropic API anywhere. NO npm. NO build step.
 ## LLM Client Rules (Gemini)
 - Model: `gemini-2.0-flash` everywhere. Never use other model names in game/agent code.
-- Import: `import google.generativeai as genai` — never `anthropic`.
-- Configure once at module level: `genai.configure(api_key=os.environ["GOOGLE_API_KEY"])`.
 - ALL Gemini calls wrapped in try/except returning `SYNTHETIC_RESPONSE` on failure.
 - JSON extraction: always strip markdown fences before `json.loads()`.
 - Async Gemini calls: use `asyncio.get_event_loop().run_in_executor(None, lambda: ...)`.

 ## LLM Client Rules (Gemini)
 - Model: `gemini-2.0-flash` everywhere. Never use other model names in game/agent code.
+- Import: `from google import genai` and `from google.genai import types` — never `anthropic` or legacy `google.generativeai`.
+- Client: `genai.Client(api_key=os.environ.get("GOOGLE_API_KEY", ""))`; chats via `client.chats.create(model="gemini-2.0-flash", ...)`.
 - ALL Gemini calls wrapped in try/except returning `SYNTHETIC_RESPONSE` on failure.
 - JSON extraction: always strip markdown fences before `json.loads()`.
 - Async Gemini calls: use `asyncio.get_event_loop().run_in_executor(None, lambda: ...)`.

agent/gemini_client.py CHANGED Viewed

@@ -1,6 +1,6 @@
 """
 Google Gemini 2.0 Flash client for Parlay.
-All calls are async (via run_in_executor). All errors return SYNTHETIC_RESPONSE.
 """
 import asyncio
 import json
@@ -8,12 +8,41 @@ import logging
 import os
 from typing import Optional
-import google.generativeai as genai
 logger = logging.getLogger(__name__)
-genai.configure(api_key=os.environ.get("GOOGLE_API_KEY", ""))
-_model = genai.GenerativeModel("gemini-2.0-flash")
 SYNTHETIC_RESPONSE: dict = {
     "utterance": "I need a moment to consider your proposal.",
@@ -49,22 +78,25 @@ async def call_gemini(
             f'{{"utterance": "...", "offer_amount": <number or null>, '
             f'"tactical_move": <string or null>}}'
         )
-        loop = asyncio.get_event_loop()
-        chat = _model.start_chat(history=history)
-        response = await loop.run_in_executor(
-            None,
-            lambda: chat.send_message(
-                f"{full_prompt}\n\nUser: {last_msg}",
-                generation_config=genai.types.GenerationConfig(
                     max_output_tokens=max_tokens,
                     temperature=0.7,
                 ),
-            ),
-        )
-        text = response.text.strip()
         text = text.replace("```json", "").replace("```", "").strip()
         parsed = json.loads(text)
@@ -79,10 +111,10 @@ async def call_gemini(
     except json.JSONDecodeError:
         logger.warning("Gemini JSON parse failed — using text fallback")
-        try:
-            return {**SYNTHETIC_RESPONSE, "utterance": response.text[:300]}
-        except Exception:
-            return SYNTHETIC_RESPONSE
     except Exception as exc:
         logger.error(f"Gemini API error: {exc}")
         return SYNTHETIC_RESPONSE
@@ -117,19 +149,22 @@ async def call_gemini_tom(
     )
     try:
-        loop = asyncio.get_event_loop()
-        chat = _model.start_chat(history=conversation_history)
-        response = await loop.run_in_executor(
-            None,
-            lambda: chat.send_message(
                 tom_prompt,
-                generation_config=genai.types.GenerationConfig(
                     max_output_tokens=200,
                     temperature=0.3,
                 ),
-            ),
-        )
-        text = response.text.strip().replace("```json", "").replace("```", "").strip()
         return json.loads(text)
     except Exception as exc:
         logger.error(f"Gemini ToM inference error: {exc}")

 """
 Google Gemini 2.0 Flash client for Parlay.
+Uses the google-genai SDK. All calls are async (via run_in_executor). All errors return SYNTHETIC_RESPONSE.
 """
 import asyncio
 import json
 import os
 from typing import Optional
+from google import genai
+from google.genai import types
 logger = logging.getLogger(__name__)
+MODEL_ID = "gemini-2.0-flash"
+_client: Optional[genai.Client] = None
+def _get_client() -> genai.Client:
+    """Lazily construct API client (empty key is allowed; calls then fail and return synthetic output)."""
+    global _client
+    if _client is None:
+        _client = genai.Client(api_key=os.environ.get("GOOGLE_API_KEY") or "")
+    return _client
+def _legacy_messages_to_history(messages: list[dict]) -> list[types.Content]:
+    """Convert legacy {'role','parts'} messages to google-genai Content list."""
+    contents: list[types.Content] = []
+    for m in messages:
+        role = m.get("role", "user")
+        if role not in ("user", "model"):
+            role = "user"
+        raw_parts = m.get("parts") or []
+        parts: list[types.Part] = []
+        for p in raw_parts:
+            text = p if isinstance(p, str) else str(p)
+            parts.append(types.Part(text=text))
+        if not parts:
+            parts.append(types.Part(text=""))
+        contents.append(types.Content(role=role, parts=parts))
+    return contents
 SYNTHETIC_RESPONSE: dict = {
     "utterance": "I need a moment to consider your proposal.",
             f'{{"utterance": "...", "offer_amount": <number or null>, '
             f'"tactical_move": <string or null>}}'
         )
+        user_message = f"{full_prompt}\n\nUser: {last_msg}"
+        def _call() -> types.GenerateContentResponse:
+            chat = _get_client().chats.create(
+                model=MODEL_ID,
+                history=_legacy_messages_to_history(history),
+            )
+            return chat.send_message(
+                user_message,
+                config=types.GenerateContentConfig(
                     max_output_tokens=max_tokens,
                     temperature=0.7,
                 ),
+            )
+        loop = asyncio.get_event_loop()
+        response = await loop.run_in_executor(None, _call)
+        text = (response.text or "").strip()
         text = text.replace("```json", "").replace("```", "").strip()
         parsed = json.loads(text)
     except json.JSONDecodeError:
         logger.warning("Gemini JSON parse failed — using text fallback")
+        raw = text[:300] if text else ""
+        if raw:
+            return {**SYNTHETIC_RESPONSE, "utterance": raw}
+        return SYNTHETIC_RESPONSE
     except Exception as exc:
         logger.error(f"Gemini API error: {exc}")
         return SYNTHETIC_RESPONSE
     )
     try:
+        def _call() -> types.GenerateContentResponse:
+            chat = _get_client().chats.create(
+                model=MODEL_ID,
+                history=_legacy_messages_to_history(conversation_history),
+            )
+            return chat.send_message(
                 tom_prompt,
+                config=types.GenerateContentConfig(
                     max_output_tokens=200,
                     temperature=0.3,
                 ),
+            )
+        loop = asyncio.get_event_loop()
+        response = await loop.run_in_executor(None, _call)
+        text = (response.text or "").strip().replace("```json", "").replace("```", "").strip()
         return json.loads(text)
     except Exception as exc:
         logger.error(f"Gemini ToM inference error: {exc}")

requirements.txt CHANGED Viewed

@@ -3,7 +3,7 @@ uvicorn[standard]==0.45.0
 websockets==15.0.1
 pydantic>=2.11.7,<3.0.0
 aiosqlite==0.20.0
-google-generativeai>=0.8.0
 fastmcp==3.2.4
 numpy==1.26.4
 scikit-learn==1.4.2

 websockets==15.0.1
 pydantic>=2.11.7,<3.0.0
 aiosqlite==0.20.0
+google-genai>=1.0.0
 fastmcp==3.2.4
 numpy==1.26.4
 scikit-learn==1.4.2

training/notebooks/parlay_training.ipynb CHANGED Viewed

@@ -43,7 +43,7 @@
    "outputs": [],
    "source": [
     "# Cell 1: Install all dependencies\n",
-    "!pip install -q fastapi uvicorn websockets pydantic aiosqlite google-generativeai fastmcp numpy python-dotenv httpx\n",
     "!pip install -q trl peft transformers accelerate bitsandbytes datasets huggingface-hub\n",
     "!pip install -q matplotlib\n",
     "print('✓ All dependencies installed')"

    "outputs": [],
    "source": [
     "# Cell 1: Install all dependencies\n",
+    "!pip install -q fastapi uvicorn websockets pydantic aiosqlite google-genai fastmcp numpy python-dotenv httpx\n",
     "!pip install -q trl peft transformers accelerate bitsandbytes datasets huggingface-hub\n",
     "!pip install -q matplotlib\n",
     "print('✓ All dependencies installed')"