Spaces:

rahul24raj
/

fish_farm_env

Sleeping

File size: 7,239 Bytes

"""FastAPI application for the Fish Farm OpenEnv environment.

Uses the official openenv create_fastapi_app() which auto-generates:
  /ws, /reset, /step, /state, /health, /web, /docs, /schema

Custom endpoints added for hackathon compliance:
  /tasks   - List all tasks with action schema
  /grader  - Grade a completed episode
  /baseline - Run heuristic baseline on task(s)

Run locally:
    uvicorn src.agentic_rl.server.app:app --reload --port 8000
"""

import sys
import os
from dataclasses import asdict
from typing import Any, Dict, List, Optional

from fastapi import HTTPException
from openenv.core.env_server import create_fastapi_app
from pydantic import BaseModel

from .environment import FishFarmEnvironment
from ..models import FarmAction, FarmObservation
from ..tasks import get_task, list_all_tasks, TASKS

# Add project root to path so graders module is importable
_project_root = os.path.abspath(os.path.join(os.path.dirname(__file__), "..", "..", ".."))
if _project_root not in sys.path:
    sys.path.insert(0, _project_root)

from graders.farm_graders import FarmGrader  # noqa: E402

app = create_fastapi_app(
    env=FishFarmEnvironment,
    action_cls=FarmAction,
    observation_cls=FarmObservation,
)


# ---------------------------------------------------------------------------
# Custom endpoints required by hackathon
# ---------------------------------------------------------------------------


@app.get("/tasks")
def endpoint_list_tasks():
    """Return list of all 12 tasks and the action schema."""
    return {
        "tasks": list_all_tasks(),
        "action_schema": FarmAction.model_json_schema(),
    }


class GraderRequest(BaseModel):
    task_id: str
    final_state: Dict[str, Any] = {}
    episode_history: List[Dict[str, Any]] = []


@app.post("/grader")
def endpoint_grade(req: GraderRequest):
    """Grade a completed episode using task-specific grader."""
    try:
        task = get_task(req.task_id)
    except ValueError:
        raise HTTPException(status_code=404, detail=f"Unknown task_id: {req.task_id}")

    # Convert flat observation format to nested simulator state if needed
    state = req.final_state
    if "fish" not in state and "avg_fish_weight" in state:
        state = {
            "fish": {
                "weight_g": state.get("avg_fish_weight", 50),
                "population": state.get("population", 10000),
                "mortality_today": state.get("mortality_today", 0),
                "cumulative_mortality": state.get("cumulative_mortality", 0),
                "survival_rate": state.get("survival_rate", 1.0),
                "stress_level": state.get("stress_level", 0.0),
                "feeding_response": state.get("feeding_response", "normal"),
                "biomass_kg": state.get("biomass_kg", 0),
                "growth_rate_g_day": state.get("growth_rate_g_day", 0),
                "fcr": state.get("fcr", 0),
                "sgr": state.get("sgr", 0),
                "stocking_density": state.get("stocking_density", 0),
            },
            "water": {
                "temperature": state.get("temperature", 28),
                "DO": state.get("dissolved_oxygen", 7),
                "pH": state.get("ph", 7.5),
                "TAN": state.get("ammonia", 0.1),
                "UIA": state.get("ammonia_toxic", 0.005),
                "NO2": state.get("nitrite", 0.05),
                "NO3": state.get("nitrate", 5),
                "water_quality_score": state.get("water_quality_score", 0.9),
                "algae_bloom": state.get("algae_bloom", False),
                "nighttime_do_risk": state.get("nighttime_do_risk", 0),
            },
            "economics": {
                "fish_value": state.get("current_fish_value", 0),
                "total_cost": state.get("total_cost_so_far", 0),
                "current_profit": state.get("current_profit", 0),
                "feed_price_per_kg": state.get("feed_price_per_kg", 0.5),
                "market_price_multiplier": state.get("market_price_multiplier", 1.0),
                "feed_inventory_kg": state.get("feed_remaining_kg", 500),
                "cost_breakdown": {},
            },
            "disease": {
                "active": state.get("disease_suspected", False),
                "infected": 0,
                "recovered": 0,
            },
            "time": {
                "day": state.get("day_in_cycle", 0),
                "hour": state.get("time_of_day", 0),
                "day_of_year": state.get("day_of_year", 90),
            },
            "done": state.get("done", True),
            "harvested": state.get("harvested", False),
        }

    grader = FarmGrader()
    result = grader.grade(
        task_id=req.task_id,
        final_state=state,
        episode_history=req.episode_history,
        task_config=task,
    )
    return asdict(result)


class BaselineRequest(BaseModel):
    task_id: Optional[str] = None


@app.post("/baseline")
def endpoint_baseline(req: BaselineRequest):
    """Run a constant-action baseline agent on task(s) and return scores.

    This heuristic uses moderate feeding (0.4), moderate aeration (0.6),
    no heating, light water exchange — a reasonable but unoptimized strategy.
    """
    from ..engine.simulator import FishFarmSimulator

    grader = FarmGrader()
    task_ids = [req.task_id] if req.task_id else list(TASKS.keys())
    results = []

    for tid in task_ids:
        try:
            task = get_task(tid)
        except ValueError:
            raise HTTPException(status_code=404, detail=f"Unknown task_id: {tid}")

        # Run simulation with constant baseline action
        sim = FishFarmSimulator(seed=42)
        ic = task["initial_conditions"]
        sim.reset(
            initial_weight=ic["weight_g"],
            initial_population=ic["population"],
            initial_temp=ic["temp"],
            initial_DO=ic["DO"],
            initial_TAN=ic["TAN"],
            initial_pH=ic["pH"],
            day_of_year=ic["day_of_year"],
            base_air_temp=ic.get("base_air_temp", 30.0),
            seed=42,
            scheduled_events=task["events"][:] if task["events"] else None,
        )

        history = []
        max_hours = min(task["episode_hours"], 720)  # cap at 30 days for baseline speed

        for _ in range(max_hours):
            state = sim.step(
                feeding_rate=0.4,
                aeration_rate=0.6,
                heater_setting=0.0,
                water_exchange_rate=0.02,
                harvest=False,
                treatment="none",
            )
            history.append(state)
            if state["done"]:
                break

        grade_result = grader.grade(tid, state, history, task)

        results.append({
            "task_id": tid,
            "difficulty": task["difficulty"],
            "grader_score": grade_result.score,
            "grader_passed": grade_result.passed,
            "grader_feedback": grade_result.feedback,
            "hours_simulated": len(history),
        })

    return {
        "results": results,
        "total_tasks": len(results),
        "avg_grader_score": sum(r["grader_score"] for r in results) / len(results) if results else 0.0,
    }