File size: 1,379 Bytes
4fbc241 4645de0 4fbc241 4645de0 4fbc241 4645de0 4fbc241 4645de0 4fbc241 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 | # syntax=docker/dockerfile:1.7
FROM python:3.11-slim AS builder
ENV PYTHONDONTWRITEBYTECODE=1
ENV PYTHONUNBUFFERED=1
ENV PIP_DISABLE_PIP_VERSION_CHECK=1
WORKDIR /app
COPY pyproject.toml README.md openenv.yaml ./
COPY llmserve_env ./llmserve_env
COPY server ./server
COPY agents ./agents
COPY rl ./rl
COPY data ./data
COPY weights ./weights
COPY inference.py evaluate.py train.py ./
RUN --mount=type=cache,target=/root/.cache/pip \
python -m pip install --upgrade pip setuptools wheel && \
printf 'torch==2.5.1+cpu\n' > /tmp/constraints.txt && \
python -m pip install --prefix=/install \
--extra-index-url https://download.pytorch.org/whl/cpu \
-c /tmp/constraints.txt .
FROM python:3.11-slim
ENV PYTHONDONTWRITEBYTECODE=1
ENV PYTHONUNBUFFERED=1
ENV ENABLE_WEB_INTERFACE=true
WORKDIR /app
COPY --from=builder /install /usr/local
COPY pyproject.toml README.md openenv.yaml ./
COPY llmserve_env ./llmserve_env
COPY server ./server
COPY agents ./agents
COPY rl ./rl
COPY data ./data
COPY weights ./weights
COPY inference.py evaluate.py train.py ./
EXPOSE 7860
HEALTHCHECK --interval=30s --timeout=5s --start-period=15s --retries=3 \
CMD python -c "import urllib.request; urllib.request.urlopen('http://127.0.0.1:7860/health', timeout=5)" || exit 1
CMD ["uvicorn", "server.app:app", "--host", "0.0.0.0", "--port", "7860", "--workers", "1"]
|