Spaces:

Jibrann
/

app

Runtime error

App Files Files Community

Jibrann commited on 23 days ago

Commit

77768cf

verified ·

1 Parent(s): 3ce9074

Upload folder using huggingface_hub

Browse files

Files changed (6) hide show

README.md +1 -0
inference.py +171 -41
server/app.py +13 -0
server/app_environment.py +22 -3
server/requirements.txt +2 -1
utils.py +2 -2

README.md CHANGED Viewed

@@ -8,5 +8,6 @@ sdk_version: "4.66"
 python_version: "3.13"
 app_file: server/app.py
 pinned: false
 base_path: /web
 ---

 python_version: "3.13"
 app_file: server/app.py
 pinned: false
+app_port: 8000
 base_path: /web
 ---

inference.py CHANGED Viewed

@@ -1,41 +1,171 @@
-import os
-import re
-import base64
-import textwrap
-from io import BytesIO
-from typing import List, Optional, Dict
-from openai import OpenAI
-import numpy as np
-from PIL import Image
-API_BASE_URL = os.getenv("API_BASE_URL")
-API_KEY = os.getenv("HF_TOKEN") or os.getenv("API_KEY")
-MODEL_NAME = os.getenv("MODEL_NAME")
-SYSTEM_PROMPT = textwrap.dedent(
-    """
-    You control a web browser through BrowserGym.
-    Reply with exactly one action string.
-    The action must be a valid BrowserGym command such as:
-    - noop()
-    - click('<BID>')
-    - type('selector', 'text to enter')
-    - fill('selector', 'text to enter')
-    - send_keys('Enter')
-    - scroll('down')
-    Use single quotes around string arguments.
-    When clicking, use the BrowserGym element IDs (BIDs) listed in the user message.
-    If you are unsure, respond with noop().
-    Do not include explanations or additional text.
-    """
-).strip()
-def main() -> None:
-    client = OpenAI(base_url=API_BASE_URL, api_key=API_KEY)
-if __name__ == "__main__":
-    main()

+import os
+from dotenv import load_dotenv
+from openai import OpenAI
+import json
+from json import JSONDecodeError
+import time
+try:
+    from models import AppAction, AppObservation
+except ImportError:
+    from app.models import AppAction, AppObservation
+try:
+    from server.app_environment import AppEnvironment
+except ImportError:
+    from app.server.app_environment import AppEnvironment
+load_dotenv()
+API_URL = os.getenv("API_BASE_URL")
+MODEL = os.getenv("MODEL_NAME")
+API_KEY = os.getenv("API_KEY") or os.getenv("HF_TOKEN")
+MAX_STEPS = 8
+TEMPERATURE = 0.2
+FALLBACK_ACTION = {
+    "isSegmentation": False,
+    "placement": {},
+    "findObjects": {},
+}
+DEBUG = True
+SYSTEM_PROMPT = """
+        You are an intelligent agent controlling a 3D object placement environment. Your task is to:
+        1. **Segment objects** in the environment if `isSegmentation=True`.
+        2. **Identify objects** and their properties (name, stackable) accurately.
+        3. **Place objects** in the 3D grid respecting stacking rules and dimensions.
+        4. **Use rewards and feedback** from previous steps to improve future actions.
+        You must strictly return actions that conform to this Pydantic schema:
+        AppAction:
+        {
+            placement: Dict[str, Tuple[int, int, int, bool]]
+            isSegmentation: bool
+            findObjects: Dict[str, Tuple[int, int, int, bool]]
+        }
+        Rules:
+        - Only report objects that are found or placed; empty dicts are valid if none.
+        - Do not modify objects that are already placed unless instructed.
+        - Coordinates must be within the grid bounds.
+        - Respect stackable property: non-stackable objects cannot be placed on top of another object.
+        - Use previous step’s reward and rewardFeedback to adjust your strategy.
+        Output:
+        - Always return a valid JSON object conforming to the schema.
+        - Do not include any extra text, explanations, or commentary.
+        - If no action is possible, return empty dicts for `placement` and `findObjects`.
+        Your goal:
+        - Maximize cumulative reward.
+        - Identify all objects correctly.
+        - Place objects efficiently while respecting stacking rules.
+        - Learn from reward feedback to improve placement in future steps.
+        Always return a valid JSON that conforms exactly to the AppAction Pydantic model:
+        {"placement": Dict[str, Tuple[int,int,int,bool]] or {}, "isSegmentation": bool, "findObjects": Dict[str, Tuple[int,int,int,bool]] or {}}
+        Actions:
+        - To place an object: {"isSegmentation": false, "placement": {"object_name": [x, y, z, stackable]}, "findObjects": {}}
+        - To segment objects: {"isSegmentation": true, "placement": {}, "findObjects": {"object_name": [x, y, z, stackable]}}
+        Do not include explanations, text, or extra fields.
+        If no objects are found or placed, return empty dicts for placement and findObjects.
+        The output must be parseable and valid for AppAction(**json_output).
+    """.strip()
+MESSAGES = [{"role": "system", "content": SYSTEM_PROMPT}]
+HISTORY = []
+def _fallback_action() -> AppAction:
+    return AppAction(**FALLBACK_ACTION)
+def _extract_json_payload(output_str: str) -> str:
+    output_str = output_str.strip()
+    if output_str.startswith("```"):
+        lines = output_str.splitlines()
+        if len(lines) >= 3:
+            output_str = "\n".join(lines[1:-1]).strip()
+    start = output_str.find("{")
+    end = output_str.rfind("}")
+    if start == -1 or end == -1 or end < start:
+        raise JSONDecodeError("No JSON object found in model output", output_str, 0)
+    return output_str[start : end + 1]
+def parse_output(output_str: str) -> AppAction:
+    try:
+        data = json.loads(_extract_json_payload(output_str))
+        return AppAction(**data)
+    except (JSONDecodeError, TypeError, ValueError) as exc:
+        print(f"Invalid Output: {exc}")
+        print(f"Raw model output: {output_str!r}")
+        return _fallback_action()
+def main() -> None:
+    if not API_URL or not MODEL or not API_KEY:
+        missing = [
+            name
+            for name, value in (
+                ("API_BASE_URL", API_URL),
+                ("MODEL_NAME", MODEL),
+                ("API_KEY/HF_TOKEN", API_KEY),
+            )
+            if not value
+        ]
+        raise RuntimeError(f"Missing required environment variables: {', '.join(missing)}")
+    env = AppEnvironment()
+    observation: AppObservation = env.reset()
+    client = OpenAI(
+        base_url=API_URL,
+        api_key=API_KEY,
+    )
+    for i in range(1, MAX_STEPS + 1):
+        MESSAGES.append(
+            {
+                "role": "user",
+                "content": f"""Observation: {observation.model_dump_json()},
+                    Previous reward: {observation.reward},
+                    Previous reward list: {observation.rewardList},
+                    Previous reward feedback: {observation.rewardFeedback},
+                    Step: {i}""".strip(),
+            }
+        )
+        llm_output = client.chat.completions.create(
+            model=MODEL,
+            messages=MESSAGES,
+            temperature=TEMPERATURE,
+        )
+        message_content = llm_output.choices[0].message.content or ""
+        action: AppAction = parse_output(message_content)
+        MESSAGES.append({"role": "assistant", "content": message_content})
+        observation: AppObservation = env.step(action)
+        HISTORY.append(observation)
+        if observation.isDone:
+            break
+        time.sleep(10000)
+    print(HISTORY)
+if __name__ == "__main__":
+    main()

server/app.py CHANGED Viewed

@@ -22,6 +22,19 @@ app = create_app(
 )
 def main(host: str = "0.0.0.0", port: int = 8000):
     """
     Entry point for direct execution via uv run or python -m.

 )
+@app.get("/health")
+def health() -> dict[str, str]:
+    return {"status": "ok"}
+@app.get("/")
+def root() -> dict[str, str]:
+    return {
+        "message": "Object Placer API is running",
+        "health": "/health",
+    }
 def main(host: str = "0.0.0.0", port: int = 8000):
     """
     Entry point for direct execution via uv run or python -m.

server/app_environment.py CHANGED Viewed

@@ -59,15 +59,34 @@ class AppEnvironment(Environment):
         self._state.step_count += 1
         reward = 0.0
-        if action.isSegmentation:
             reward += 10.0
             appendRewardFeedback(self._state, "Segmentation successful.", reward)
-        if action.placement:
             reward += place(action.isSegmentation, action.placement, self._state)
             appendRewardFeedback(self._state, "Object placed successfully.", reward)
-        if action.findObjects:
             reward += findobject(action.isSegmentation, action.findObjects, self._state)
             appendRewardFeedback(self._state, "Object found successfully.", reward)

         self._state.step_count += 1
         reward = 0.0
+        if action is None:
+            reward -= 10.0
+            appendRewardFeedback(
+                self._state,
+                "No action is of invalid schema or format. Penalty applied.",
+                reward,
+            )
+            return AppObservation(
+                currentGrid=self._state.currentGrid,
+                positions=self._state.ObjectsPresent,
+                objectsLeft=self._state.objectsLeft,
+                objectsFound=self._state.objectsFound,
+                reward=self._state.reward,
+                isDone=self._state.isDone,
+                rewardFeedback=self._state.rewardFeedback,
+                rewardList=self._state.rewardList,
+            )
+        if action.isSegmentation and action is not None:
             reward += 10.0
             appendRewardFeedback(self._state, "Segmentation successful.", reward)
+        if action.placement and action is not None:
             reward += place(action.isSegmentation, action.placement, self._state)
             appendRewardFeedback(self._state, "Object placed successfully.", reward)
+        if action.findObjects and action is not None:
             reward += findobject(action.isSegmentation, action.findObjects, self._state)
             appendRewardFeedback(self._state, "Object found successfully.", reward)

server/requirements.txt CHANGED Viewed

@@ -3,4 +3,5 @@ fastapi
 uvicorn
 numpy
 scikit-learn
-matplotlib

 uvicorn
 numpy
 scikit-learn
+matplotlib
+python-dotenv

utils.py CHANGED Viewed

@@ -141,7 +141,7 @@ def place(segment, objects, state):
     totalObjs = len(objects)
     reward_per_obj_placed = 45.0 / totalObjs
-    if segment:
         appendRewardFeedback(
             state, "Placing objects without segmentation is not allowed.", -60.0
         )
@@ -237,7 +237,7 @@ def place(segment, objects, state):
 def findobject(segment, objects, state):
-    if not segment:
         appendRewardFeedback(
             state, "Finding objects without segmentation is not allowed.", -60.0
         )

     totalObjs = len(objects)
     reward_per_obj_placed = 45.0 / totalObjs
+    if segment or segment is None:
         appendRewardFeedback(
             state, "Placing objects without segmentation is not allowed.", -60.0
         )
 def findobject(segment, objects, state):
+    if not segment or segment is None:
         appendRewardFeedback(
             state, "Finding objects without segmentation is not allowed.", -60.0
         )