docker_selfhosted / Dockerfile
Leon4gr45's picture
Create Dockerfile
4a15a33 verified
raw
history blame
853 Bytes
# Image that serves the FastAPI application defined in app.py with uvicorn
# on port 7860.

# Base image: PyTorch 2.3.0 runtime with CUDA 12.1 / cuDNN 8.
FROM pytorch/pytorch:2.3.0-cuda12.1-cudnn8-runtime

# Build-time only: stops apt/debconf from prompting during package install.
# Declared as ARG (not ENV) so it is not baked into the runtime environment.
ARG DEBIAN_FRONTEND=noninteractive

# Cache locations for Hugging Face downloads and for uv.
ENV HF_HOME="/data/huggingface" \
    UV_CACHE_DIR="/data/uv_cache"

# Install git. update + install + list cleanup stay in a single layer so the
# package index is never stale and never shipped in the image.
RUN apt-get update \
    && apt-get install -y --no-install-recommends git \
    && rm -rf /var/lib/apt/lists/*

# Install uv (faster package installation); do not keep pip's download cache.
RUN pip install --no-cache-dir uv

# Create an unprivileged user and the directories it must be able to write to
# (the application directory and the cache directories named above).
# UID 1000 is an assumption about the hosting platform's runtime user —
# NOTE(review): adjust if the deployment target expects a different UID.
RUN useradd --create-home --uid 1000 user \
    && mkdir -p /app /data/huggingface /data/uv_cache \
    && chown -R user:user /app /data

# Set the working directory before any COPY so files land in /app rather than
# in whatever directory the base image happens to default to.
WORKDIR /app

# Copy only the dependency manifest first: this layer (and the install below)
# is reused from cache until requirements.txt itself changes.
COPY requirements.txt ./

# uv targets a virtual environment by default; --system installs into the
# Python interpreter found on PATH (the one shipped with the base image).
# --no-cache keeps uv's package cache out of the image layer.
RUN uv pip install --system --no-cache -r requirements.txt

# Copy the application code into the container, owned by the runtime user.
COPY --chown=user:user ./app.py /app/app.py

# Drop root privileges for everything that runs in the container.
USER user

# Document the port the app listens on (does not publish it by itself).
EXPOSE 7860

# Start the FastAPI app (object `app` in module `app`) under uvicorn,
# listening on all interfaces. Exec form so uvicorn is PID 1 and receives
# stop signals directly.
CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]