| |
| FROM python:3.11-slim AS builder |
|
|
| ENV PYTHONDONTWRITEBYTECODE=1 |
| ENV PYTHONUNBUFFERED=1 |
| ENV PIP_DISABLE_PIP_VERSION_CHECK=1 |
|
|
| WORKDIR /app |
|
|
| COPY pyproject.toml README.md openenv.yaml ./ |
|
|
| COPY llmserve_env ./llmserve_env |
| COPY server ./server |
| COPY agents ./agents |
| COPY rl ./rl |
| COPY data ./data |
| COPY weights ./weights |
| COPY inference.py evaluate.py train.py ./ |
|
|
| RUN --mount=type=cache,target=/root/.cache/pip \ |
| python -m pip install --upgrade pip setuptools wheel && \ |
| printf 'torch==2.5.1+cpu\n' > /tmp/constraints.txt && \ |
| python -m pip install --prefix=/install \ |
| --extra-index-url https://download.pytorch.org/whl/cpu \ |
| -c /tmp/constraints.txt . |
|
|
| FROM python:3.11-slim |
|
|
| ENV PYTHONDONTWRITEBYTECODE=1 |
| ENV PYTHONUNBUFFERED=1 |
| ENV ENABLE_WEB_INTERFACE=true |
|
|
| WORKDIR /app |
|
|
| COPY --from=builder /install /usr/local |
| COPY pyproject.toml README.md openenv.yaml ./ |
| COPY llmserve_env ./llmserve_env |
| COPY server ./server |
| COPY agents ./agents |
| COPY rl ./rl |
| COPY data ./data |
| COPY weights ./weights |
| COPY inference.py evaluate.py train.py ./ |
|
|
| EXPOSE 7860 |
|
|
| HEALTHCHECK --interval=30s --timeout=5s --start-period=15s --retries=3 \ |
| CMD python -c "import urllib.request; urllib.request.urlopen('http://127.0.0.1:7860/health', timeout=5)" || exit 1 |
|
|
| CMD ["uvicorn", "server.app:app", "--host", "0.0.0.0", "--port", "7860", "--workers", "1"] |
|
|