Dnfs committed on
Commit
e4c3b29
·
verified ·
1 Parent(s): 067ca1c

Update Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +10 -9
Dockerfile CHANGED
@@ -2,8 +2,6 @@
2
  FROM python:3.10-slim
3
 
4
  # 2. Install system dependencies REQUIRED FOR COMPILING llama-cpp-python
5
- # This is the key fix for the build error.
6
- # We run this as root before switching to the non-root user.
7
  RUN apt-get update && apt-get install -y \
8
  build-essential \
9
  cmake \
@@ -21,24 +19,27 @@ WORKDIR $HOME/app
21
  # 5. Copy requirements first for better Docker layer caching
22
  COPY --chown=user requirements.txt .
23
 
24
- # 6. Install Python dependencies for the non-root user
25
- # This will now succeed because the build tools are available.
 
 
 
26
  RUN pip install --no-cache-dir --user -r requirements.txt
27
 
28
- # 7. Download the model during the build process
29
  RUN huggingface-cli download Dnfs/gema-4b-indra10k-model1-Q4_K_M-GGUF \
30
  --local-dir ./model \
31
  --local-dir-use-symlinks False
32
 
33
- # 8. Copy the rest of the application code
34
  COPY --chown=user app.py .
35
 
36
- # 9. Expose the port the app runs on
37
  EXPOSE 8000
38
 
39
- # 10. Health check to ensure the app is running
40
  HEALTHCHECK --interval=30s --timeout=10s --start-period=5s --retries=3 \
41
  CMD curl -f http://localhost:8000/health || exit 1
42
 
43
- # 11. Command to run the application
44
  CMD ["python", "app.py"]
 
2
  FROM python:3.10-slim
3
 
4
  # 2. Install system dependencies REQUIRED FOR COMPILING llama-cpp-python
 
 
5
  RUN apt-get update && apt-get install -y \
6
  build-essential \
7
  cmake \
 
19
  # 5. Copy requirements first for better Docker layer caching
20
  COPY --chown=user requirements.txt .
21
 
22
+ # 6. Set build arguments to speed up llama-cpp-python installation
23
+ # This is the key fix for the timeout error. It disables GPU support checks.
24
+ ENV CMAKE_ARGS="-DLLAMA_CUBLAS=OFF -DLLAMA_METAL=OFF"
25
+
26
+ # 7. Install Python dependencies for the non-root user
27
  RUN pip install --no-cache-dir --user -r requirements.txt
28
 
29
+ # 8. Download the model during the build process
30
  RUN huggingface-cli download Dnfs/gema-4b-indra10k-model1-Q4_K_M-GGUF \
31
  --local-dir ./model \
32
  --local-dir-use-symlinks False
33
 
34
+ # 9. Copy the rest of the application code
35
  COPY --chown=user app.py .
36
 
37
+ # 10. Expose the port the app runs on
38
  EXPOSE 8000
39
 
40
+ # 11. Health check to ensure the app is running
41
  HEALTHCHECK --interval=30s --timeout=10s --start-period=5s --retries=3 \
42
  CMD curl -f http://localhost:8000/health || exit 1
43
 
44
+ # 12. Command to run the application
45
  CMD ["python", "app.py"]