Spaces:

omaryasserhassan
/

qwen-planner-api

Sleeping

omaryasserhassan committed 24 days ago

Commit

92c55d8

verified ·

1 Parent(s): fcea2ac

Update Dockerfile

Files changed (1) hide show

Dockerfile CHANGED Viewed

@@ -1,20 +1,37 @@
 # Old side of the diff view: lines marked "-" were removed by this commit,
 # space-prefixed lines are unchanged context shared with the new version.
 # Builds a Python 3.11 (slim) image that serves app.py with uvicorn on port 7860.
 FROM python:3.11-slim
-# System deps for some wheels/builds
 # Install the C/C++ toolchain, cmake and git, and delete the apt package lists
 # in the same RUN so they do not remain in this layer.
 RUN apt-get update && apt-get install -y --no-install-recommends \
     build-essential cmake git && \
     rm -rf /var/lib/apt/lists/*
 WORKDIR /app
-# Python deps
 # requirements.txt is copied on its own, before app.py, so the pip layer only
 # needs rebuilding when the requirements file changes.
 COPY requirements.txt .
 RUN pip install --no-cache-dir -r requirements.txt
 # App code
 COPY app.py .
 # EXPOSE only documents the port; uvicorn below is what actually binds 7860.
 EXPOSE 7860
-# Run FastAPI
 CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]

 # New side of the diff view: lines marked "+" were added by this commit,
 # space-prefixed lines are unchanged context.
 # Same image as before, plus a build-time step that downloads a GGUF model
 # file into /app/models so it ships inside the image.
 FROM python:3.11-slim
+# System deps for llama-cpp build
 # The apt package lists are removed in the same RUN that created them.
 RUN apt-get update && apt-get install -y --no-install-recommends \
     build-essential cmake git && \
     rm -rf /var/lib/apt/lists/*
 WORKDIR /app
+# App deps
 # NOTE(review): the download step below imports huggingface_hub, so it
 # presumably has to be listed in requirements.txt - confirm.
 COPY requirements.txt .
 RUN pip install --no-cache-dir -r requirements.txt
+# --- Bake model into the image (change these ENV if you prefer Phi-3 mini) ---
 # ENV values are visible to the RUN step below and also persist into the
 # running container's environment.
 # NOTE(review): whether app.py reads MODEL_REPO / MODEL_FILE at runtime is not
 # visible here - confirm before converting these to build-only ARGs.
+ENV MODEL_REPO=Qwen/Qwen2.5-3B-Instruct-GGUF
+ENV MODEL_FILE=qwen2.5-3b-instruct-q4_k_m.gguf
+# Download GGUF at build time to /app/models (no symlinks)
 # The heredoc feeds an inline Python script to `python -` (heredoc support in
 # RUN requires BuildKit). The script creates /app/models and calls
 # snapshot_download restricted via allow_patterns to the single MODEL_FILE name.
 # NOTE(review): os.environ.get returns None when a variable is unset; both are
 # set by the ENV lines above, so that only matters if those lines are removed.
+RUN python - <<'PY'
+from huggingface_hub import snapshot_download
+import os
+local_dir = "/app/models"
+os.makedirs(local_dir, exist_ok=True)
+snapshot_download(
+    repo_id=os.environ.get("MODEL_REPO"),
+    allow_patterns=[os.environ.get("MODEL_FILE")],
+    local_dir=local_dir,
+    local_dir_use_symlinks=False,
+)
+print("Model baked into image at /app/models")
+PY
 # App code
 # app.py is copied after the model download, so editing app.py does not
 # invalidate the cached model layer.
 COPY app.py .
 EXPOSE 7860
 # NOTE(review): no USER instruction appears in this file, so the server runs as
 # the base image's default user (presumably root) - confirm this is intended.
 CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]