docker_selfhosted / Dockerfile
Leon4gr45's picture
Update Dockerfile
cdc816f verified
raw
history blame
1.04 kB
# Base image: pytorch/pytorch, pinned to a specific tag. As the tag name
# indicates, it bundles PyTorch 2.3.0 with CUDA 12.1 and cuDNN 8 ("runtime"
# variant), so GPU-enabled Python code can run without installing CUDA here.
FROM pytorch/pytorch:2.3.0-cuda12.1-cudnn8-runtime
# Build-time only: stops apt-get from prompting during the RUN steps of this
# stage. Declared as ARG rather than ENV so the setting is available to RUN
# instructions but is not baked into the environment of running containers.
ARG DEBIAN_FRONTEND=noninteractive
# Cache locations for Hugging Face downloads and for uv, both under /data.
ENV HF_HOME="/data/huggingface" \
    UV_CACHE_DIR="/data/uv_cache"
# --- THE CRITICAL FIX ---
# Tell the dynamic linker where to find the NVIDIA CUDA libraries.
# This makes `libcuda.so.1` visible to vLLM.
# The `${VAR:+...}` form appends the inherited value only when it is set and
# non-empty, so the result never ends in a stray ":" (an empty path entry
# makes the dynamic linker search the current working directory).
ENV LD_LIBRARY_PATH=/usr/local/nvidia/lib64${LD_LIBRARY_PATH:+:${LD_LIBRARY_PATH}}
# Install git from the distribution packages. The apt package lists are
# removed in the same layer so they do not add to the image size.
# NOTE(review): git is presumably needed for VCS-based entries in
# requirements.txt — confirm, and drop it if nothing uses it.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        git \
    && rm -rf /var/lib/apt/lists/*
# Install uv (for faster package installation). --no-cache-dir keeps pip's
# download cache out of the image layer.
# NOTE(review): uv is unpinned; pin a version for reproducible builds.
RUN pip install --no-cache-dir uv
# Copy only the dependency manifest first, so the install layer below stays
# cached until requirements.txt itself changes.
# The destination is absolute on purpose: no WORKDIR has been set at this
# point in the file, so a relative "." would resolve against whatever working
# directory the base image happens to define.
COPY requirements.txt /app/requirements.txt
# Install the dependencies with uv:
#   --system    install into the system Python environment (no virtualenv)
#   --no-cache  do not keep uv's package cache in the image layer
RUN uv pip install --no-cache --system -r /app/requirements.txt
# Make /app the working directory (created if it does not exist yet), then
# place the application module inside it as /app/app.py.
WORKDIR /app
COPY app.py ./app.py
# Document the TCP port the server listens on (EXPOSE does not publish it;
# that still has to be done when the container is started).
EXPOSE 7860/tcp
# Default process: serve the `app` object from the `app` module with uvicorn,
# listening on all interfaces at port 7860. Exec (JSON-array) form is used so
# uvicorn runs directly as the container's main process, without a shell.
CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]