# ndc8
# Update Dockerfile and application entry point for GGUF backend; optimize memory usage in model parameters and requirements
# 358e717
# Base image: Debian-slim variant of the official Python 3.10 image.
FROM python:3.10-slim

# Create an unprivileged account named "user" with UID 1000
# (required by HF Spaces).
RUN useradd -m -u 1000 user

# Drop root: every later instruction, and the container itself, runs as "user".
USER user

# Runtime environment:
#   HOME / PATH - point at the new user's home so that scripts pip places in
#                 ~/.local/bin are found on PATH.
#   HF_HOME     - Hugging Face cache location, kept under /tmp
#                 (presumably because it must be writable at runtime; confirm).
#   TRANSFORMERS_NO_ADVISORY_WARNINGS - silences advisory warnings from the
#                 transformers library.
ENV HOME=/home/user \
    PATH=/home/user/.local/bin:$PATH \
    HF_HOME=/tmp/.cache/huggingface \
    TRANSFORMERS_NO_ADVISORY_WARNINGS=1

# Work from an "app" directory inside the user's home directory.
WORKDIR $HOME/app

# Copy only the dependency manifest first so the install layer below stays
# cached until requirements.txt itself changes.
COPY --chown=user requirements.txt .
RUN pip install --no-cache-dir --upgrade pip && \
    pip install --no-cache-dir -r requirements.txt

# Copy the application code, owned by the unprivileged user.
COPY --chown=user . .

# Document the listening port: 7860 (HF Spaces default).
EXPOSE 7860

# Start the GGUF backend application: uvicorn serves the `app` object from the
# `app` module on all interfaces. Exec (JSON-array) form keeps the server as
# PID 1 so it receives stop signals directly.
CMD ["python", "-m", "uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]