File size: 1,060 Bytes
8595613
 
 
 
b1245ea
8595613
 
 
b1245ea
8595613
 
b1245ea
8595613
 
 
b1245ea
8595613
 
b1245ea
8595613
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
b1245ea
8595613
 
 
 
 
 
c19e50b
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
# Base image: the vLLM OpenAI-compatible server image.
# The tag is a build argument so a build can be pinned to a specific release
# (`docker build --build-arg VLLM_IMAGE_TAG=<tag> .`) instead of always
# following a moving tag. The default preserves the previous behaviour.
ARG VLLM_IMAGE_TAG=latest
FROM vllm/vllm-openai:${VLLM_IMAGE_TAG}

# Build-time only: keeps any Debian package tooling non-interactive during the
# build without leaking the setting into the running container's environment.
ARG DEBIAN_FRONTEND=noninteractive

# Unbuffered Python stdout/stderr.
ENV PYTHONUNBUFFERED=1

# vLLM server settings.
ENV VLLM_PORT=8000 \
    MAX_MODEL_LEN=8192 \
    GPU_MEMORY_UTILIZATION=0.90

# Model name and OpenAI-compatible client settings.
# OPENAI_API_BASE is derived from VLLM_PORT at build time so the two defaults
# cannot drift apart; overriding VLLM_PORT at `docker run` time does NOT
# recompute it, so override both together.
# OPENAI_API_KEY is a literal placeholder value, not a credential.
ENV MODEL_NAME=NM-dev/NuExtract3.4_4B-RL-400 \
    OPENAI_API_BASE=http://127.0.0.1:${VLLM_PORT}/v1 \
    OPENAI_API_KEY=EMPTY

# Gradio bind address and port (the port matches the EXPOSE instruction).
ENV GRADIO_SERVER_NAME=0.0.0.0 \
    GRADIO_SERVER_PORT=7860

# Application settings.
ENV NUEXTRACT_MAX_TOKENS=5000 \
    NUEXTRACT_ASSETS_DIR=/home/user/app/assets

# Cache locations under /data.
# NOTE(review): TRANSFORMERS_CACHE is believed to be deprecated in favour of
# HF_HOME in recent transformers releases; it is kept here so the effective
# cache path does not change - confirm before removing.
ENV HF_HOME=/data/.cache/huggingface \
    TRANSFORMERS_CACHE=/data/.cache/huggingface \
    VLLM_CACHE_ROOT=/data/.cache/vllm

# Install gradio, openai and pillow without keeping pip's download cache in
# the layer.
# NOTE(review): versions are unpinned, so rebuilds may resolve to different
# releases - consider pinning once known-good versions are established.
RUN pip install --no-cache-dir gradio openai pillow

# Create the unprivileged account (UID 1000) that the container runs as.
# Creation is skipped only when an account named "user" already exists; any
# other useradd failure (for example UID 1000 already taken under a different
# name) stops the build here instead of being silently ignored.
RUN id -u user >/dev/null 2>&1 || useradd -m -u 1000 user

# Application directory; WORKDIR creates it (owned by root) if missing.
WORKDIR /home/user/app

# Copy the application, its launcher script and static assets, owned by the
# unprivileged account.
COPY --chown=user:user app.py /home/user/app/app.py
COPY --chown=user:user start.sh /home/user/app/start.sh
COPY --chown=user:user assets /home/user/app/assets

# Still running as root here:
#  - hand the application directory itself (created by WORKDIR) to the
#    unprivileged account and make the launcher executable;
#  - pre-create the cache directories named by HF_HOME / VLLM_CACHE_ROOT and
#    make them writable by that account, so the non-root process can populate
#    them when nothing is mounted over /data at runtime.
RUN mkdir -p "${HF_HOME}" "${VLLM_CACHE_ROOT}" && \
    chown -R user:user /data/.cache /home/user/app && \
    chmod +x /home/user/app/start.sh

# Documented service port (same value as GRADIO_SERVER_PORT); EXPOSE is
# informational and does not publish the port by itself.
EXPOSE 7860

# Everything from here on, including the running container, is non-root.
USER user

# Clear the entrypoint inherited from vllm/vllm-openai so that the CMD below
# is executed as-is rather than being passed to it as arguments.
ENTRYPOINT []

# Launch the startup script with bash (exec form).
CMD ["/bin/bash", "/home/user/app/start.sh"]