madDegen committed on
Commit
e63b1dc
·
verified ·
1 Parent(s): e1fc079

consolidate: HQ Dockerfile — Ollama + FastAPI orchestrator

Browse files
Files changed (1) hide show
  1. hq/Dockerfile +25 -0
hq/Dockerfile ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ FROM python:3.11-slim
2
+
3
+ # Install Ollama. The installer is saved to a file (not piped into sh) so a failed download aborts the build.
4
+ RUN apt-get update && apt-get install -y --no-install-recommends ca-certificates curl && \
5
+ curl -fsSL https://ollama.com/install.sh -o /tmp/ollama-install.sh && sh /tmp/ollama-install.sh && \
6
+ rm -rf /tmp/ollama-install.sh /var/lib/apt/lists/*
7
+
8
+ WORKDIR /app
9
+ COPY requirements.txt ./
10
+ RUN pip install --no-cache-dir --requirement requirements.txt
11
+ # Source is copied after the dependency install so code-only edits do not invalidate the pip layer.
12
+ COPY . ./
13
+
14
+ ENV OLLAMA_MAX_LOADED_MODELS=2 \
15
+ COMPUTE_STRATEGY=round_robin \
16
+ PORT=8000
17
+ # Documentation only: 8000 matches PORT above; 11434 is presumably the Ollama API port (confirm).
18
+ EXPOSE 8000/tcp 11434/tcp
19
+
20
+ # Start Ollama, poll until it answers (abort if it dies), pull both models, then exec the orchestrator
21
+ CMD ["bash", "-c", "\
22
+ ollama serve & until ollama list >/dev/null 2>&1; do kill -0 $! && sleep 1 || exit 1; done && \
23
+ ollama pull ${REASONER_MODEL:-gemma4:e4b-instruct-q4_K_M} && \
24
+ ollama pull ${CODER_MODEL:-qwen3.5:4b-instruct-q4_K_M} && \
25
+ exec python orchestrator.py"]