# Copyright (c) Meta Platforms, Inc. and affiliates. # All rights reserved. # # This source code is licensed under the BSD-style license found in the # LICENSE file in the root directory of this source tree. """ FastAPI application for the Axiomforgeai Environment. This module creates an HTTP server that exposes the AxiomforgeaiEnvironment over HTTP and WebSocket endpoints, compatible with EnvClient. Endpoints: - POST /reset: Reset the environment - POST /step: Execute an action - GET /state: Get current environment state - GET /schema: Get action/observation schemas - WS /ws: WebSocket endpoint for persistent sessions Usage: # Development (with auto-reload): uvicorn server.app:app --reload --host 0.0.0.0 --port 8000 # Production: uvicorn server.app:app --host 0.0.0.0 --port 8000 --workers 4 # Or run directly: python -m server.app """ from fastapi import Request from fastapi.responses import HTMLResponse try: from openenv.core.env_server.http_server import create_app except Exception as e: # pragma: no cover raise ImportError( "openenv is required for the web interface. Install dependencies with '\n uv sync\n'" ) from e try: from ..models import AxiomforgeaiAction, AxiomforgeaiObservation from .AxiomForgeAI_environment import AxiomforgeaiEnvironment except ImportError: from models import AxiomforgeaiAction, AxiomforgeaiObservation from server.AxiomForgeAI_environment import AxiomforgeaiEnvironment # Create the app with web interface and README integration app = create_app( AxiomforgeaiEnvironment, AxiomforgeaiAction, AxiomforgeaiObservation, env_name="AxiomForgeAI", max_concurrent_envs=1, # increase this number to allow more concurrent WebSocket sessions ) _HOMEPAGE_HTML = """
A self-improving math RL environment. The model practices on verified problems, generates new challenges when ready, and learns from solution attempts whose reasoning steps and final answers agree.
Start a new episode. Returns a math question with topic and difficulty metadata.
Submit a solution for the current question. Returns reward, feedback, and scoring breakdown.
Get the current episode state including episode ID and step count.
Returns JSON schemas for action and observation types.
Health check endpoint. Returns server status and environment availability.
WebSocket endpoint for persistent sessions. Supports concurrent multi-agent connections.