ffreemt committed on
Commit
2c7ae2c
·
1 Parent(s): fab6488

--cpu-strict -np 2

Browse files
Files changed (2) hide show
  1. Dockerfile +3 -2
  2. README.md +1 -1
Dockerfile CHANGED
@@ -4,7 +4,7 @@ FROM ghcr.io/ggml-org/llama.cpp:server
4
  WORKDIR /app
5
 
6
  RUN apt update && apt install -y python3 python3-pip python3-venv pipx
7
- ENV PATH="/root/.local/bin:$PATH"
8
 
9
  # RUN pip install huggingface_hub --break-system-packages
10
  RUN pipx install huggingface_hub
@@ -13,10 +13,11 @@ RUN pipx install huggingface_hub
13
  RUN hf download prism-ml/Bonsai-8B-gguf Bonsai-8B.gguf --local-dir /app
14
  RUN mv /app/Bonsai-8B.gguf /app/bonsai-8b
15
 
16
- #MD ["--server", \
17
  CMD ["--model", "/app/bonsai-8b", \
18
  "--host", "0.0.0.0", \
19
  "--port", "7860", \
 
20
  "-t", "2", \
21
  "--cache-type-k", "q8_0", \
22
  "--cache-type-v", "iq4_nl", \
 
4
  WORKDIR /app
5
 
6
  RUN apt update && apt install -y python3 python3-pip python3-venv pipx
7
+ ENV PATH=/root/.local/bin:$PATH
8
 
9
  # RUN pip install huggingface_hub --break-system-packages
10
  RUN pipx install huggingface_hub
 
13
  RUN hf download prism-ml/Bonsai-8B-gguf Bonsai-8B.gguf --local-dir /app
14
  RUN mv /app/Bonsai-8B.gguf /app/bonsai-8b
15
 
16
+ # CMD ["--server", \
17
  CMD ["--model", "/app/bonsai-8b", \
18
  "--host", "0.0.0.0", \
19
  "--port", "7860", \
20
+ "--cpu-strict", "-np", "2", \
21
  "-t", "2", \
22
  "--cache-type-k", "q8_0", \
23
  "--cache-type-v", "iq4_nl", \
README.md CHANGED
@@ -1,5 +1,5 @@
1
  ---
2
- title: bonsai-b
3
  emoji: 💻
4
  colorFrom: purple
5
  colorTo: blue
 
1
  ---
2
+ title: bonsai-8b
3
  emoji: 💻
4
  colorFrom: purple
5
  colorTo: blue