Update Dockerfile
Browse files
- Dockerfile (+12 -5)
Dockerfile
CHANGED
|
@@ -1,10 +1,11 @@
|
|
|
|
|
| 1 |
FROM python:3.11-slim
|
| 2 |
|
| 3 |
# INSTALA DEPENDÊNCIAS DO SISTEMA
|
| 4 |
RUN apt-get update && \
|
| 5 |
apt-get install -y --no-install-recommends \
|
| 6 |
-
|
| 7 |
-
|
| 8 |
&& rm -rf /var/lib/apt/lists/*
|
| 9 |
|
| 10 |
# BAIXA E INSTALA OLLAMA
|
|
@@ -24,16 +25,22 @@ RUN pip install --no-cache-dir -r requirements.txt
|
|
| 24 |
EXPOSE 7860
|
| 25 |
EXPOSE 11434
|
| 26 |
|
| 27 |
-
# PUXA MODELO
|
| 28 |
RUN ollama serve & \
|
| 29 |
OLLAMA_PID=$! && \
|
| 30 |
-
sleep
|
| 31 |
-
ollama pull qwen2.5:
|
| 32 |
kill $OLLAMA_PID || true
|
| 33 |
|
| 34 |
# HEALTHCHECK
|
| 35 |
HEALTHCHECK --interval=30s --timeout=10s --start-period=60s --retries=3 \
|
| 36 |
CMD curl -f http://localhost:7860/health || exit 1
|
| 37 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 38 |
# INICIA app.py
|
| 39 |
CMD ["python", "app.py"]
|
|
|
|
| 1 |
+
# Dockerfile
|
| 2 |
FROM python:3.11-slim
|
| 3 |
|
| 4 |
# Install system dependencies.
# curl is required by the HEALTHCHECK probe; ca-certificates provides the CA bundle.
# The apt package lists are removed in the same layer so they do not persist in the image.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        ca-certificates \
        curl \
    && rm -rf /var/lib/apt/lists/*
|
| 10 |
|
| 11 |
# BAIXA E INSTALA OLLAMA
|
|
|
|
| 25 |
EXPOSE 7860
|
| 26 |
EXPOSE 11434
|
| 27 |
|
| 28 |
+
# === PUXA MODELO LEVE + QUANTIZADO DURANTE BUILD ===
|
| 29 |
# Pull the model at build time so it is baked into the image.
# A temporary Ollama server is started in the background for this step only.
#
# Why this differs from a plain `sleep N && ollama pull ... && kill $PID || true`:
#   * In the shell, a trailing `|| true` applies to the WHOLE `&&` chain, so a failed
#     `ollama pull` would be swallowed and the image would build without the model.
#     Here `|| true` is scoped to `kill` only, so a failed pull fails the build.
#   * A fixed sleep is a race: readiness is polled with `ollama list` (which needs a
#     responding server) for up to ~60 seconds instead.
# NOTE(review): confirm the tag `qwen2.5:3b-q4_0` exists in the Ollama library; with
# this change a non-existent tag now aborts the build instead of passing silently.
RUN ollama serve & \
    OLLAMA_PID=$! && \
    tries=0 && \
    until ollama list >/dev/null 2>&1; do \
        tries=$((tries + 1)); \
        if [ "$tries" -ge 60 ]; then \
            echo "ollama server did not become ready in time" >&2; \
            exit 1; \
        fi; \
        sleep 1; \
    done && \
    ollama pull qwen2.5:3b-q4_0 && \
    { kill "$OLLAMA_PID" || true; }
|
| 34 |
|
| 35 |
# HEALTHCHECK
|
| 36 |
HEALTHCHECK --interval=30s --timeout=10s --start-period=60s --retries=3 \
|
| 37 |
CMD curl -f http://localhost:7860/health || exit 1
|
| 38 |
|
| 39 |
+
# Environment variables (tuning) for Ollama, grouped into a single ENV instruction.
# Values are unchanged; they persist into the running container.
ENV OLLAMA_NUM_PARALLEL=3 \
    OLLAMA_MAX_QUEUE=10 \
    OLLAMA_KEEP_ALIVE=10m \
    OLLAMA_MAX_LOADED_MODELS=1
|
| 44 |
+
|
| 45 |
# INICIA app.py
|
| 46 |
CMD ["python", "app.py"]
|