Spaces:
Running on A100
Running on A100
File size: 1,060 Bytes
8595613 b1245ea 8595613 b1245ea 8595613 b1245ea 8595613 b1245ea 8595613 b1245ea 8595613 b1245ea 8595613 c19e50b | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 | FROM vllm/vllm-openai:latest
ENV DEBIAN_FRONTEND=noninteractive
ENV PYTHONUNBUFFERED=1
ENV MODEL_NAME=NM-dev/NuExtract3.4_4B-RL-400
ENV OPENAI_API_BASE=http://127.0.0.1:8000/v1
ENV OPENAI_API_KEY=EMPTY
ENV GRADIO_SERVER_NAME=0.0.0.0
ENV GRADIO_SERVER_PORT=7860
ENV VLLM_PORT=8000
ENV MAX_MODEL_LEN=8192
ENV GPU_MEMORY_UTILIZATION=0.90
ENV NUEXTRACT_MAX_TOKENS=5000
ENV NUEXTRACT_ASSETS_DIR=/home/user/app/assets
ENV HF_HOME=/data/.cache/huggingface
ENV TRANSFORMERS_CACHE=/data/.cache/huggingface
ENV VLLM_CACHE_ROOT=/data/.cache/vllm
RUN pip install --no-cache-dir \
gradio \
openai \
pillow
RUN useradd -m -u 1000 user || true
WORKDIR /home/user/app
COPY --chown=user:user app.py /home/user/app/app.py
COPY --chown=user:user start.sh /home/user/app/start.sh
COPY --chown=user:user assets /home/user/app/assets
RUN chown -R user:user /home/user/app && \
chmod +x /home/user/app/start.sh
USER user
EXPOSE 7860
# Important: override vllm/vllm-openai's default entrypoint.
ENTRYPOINT []
CMD ["/bin/bash", "/home/user/app/start.sh"] |