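# NOTE: the three lines below are page-status text captured together with this
# file; they are kept as comments so that the Dockerfile parses.
# Spaces:
# Runtime error
# Runtime error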
# Use a standard base image with CUDA support.
FROM pytorch/pytorch:2.3.0-cuda12.1-cudnn8-runtime

# Build-time only: keeps apt-get non-interactive during the build without
# leaking the setting into the environment of the running container.
ARG DEBIAN_FRONTEND=noninteractive

# Cache locations for Hugging Face downloads and for uv.
ENV HF_HOME="/data/huggingface" \
    UV_CACHE_DIR="/data/uv_cache"

# --- THE CRITICAL FIX ---
# Tell the dynamic linker where to find the NVIDIA CUDA libraries.
# This makes `libcuda.so.1` visible to vLLM.
# The `:+` expansion appends the inherited value only when one is set, so an
# unset variable never leaves a trailing ':' behind (an empty entry would make
# the linker search the current working directory).
ENV LD_LIBRARY_PATH=/usr/local/nvidia/lib64${LD_LIBRARY_PATH:+:${LD_LIBRARY_PATH}}

# Set the application directory up front so every relative path below resolves
# under /app instead of whatever directory the base image defaults to.
WORKDIR /app

# Install git and uv (for faster package installation).
# The apt package lists are removed in the same layer that created them.
RUN apt-get update \
    && apt-get install -y --no-install-recommends git \
    && rm -rf /var/lib/apt/lists/*
# --no-cache-dir keeps pip's download cache out of the image layer.
RUN pip install --no-cache-dir uv

# Copy requirements first and install them into the system environment, so
# this layer is reused until requirements.txt itself changes.
COPY requirements.txt ./
RUN uv pip install --no-cache --system -r requirements.txt

# Copy the application code into the container (ends up at /app/app.py).
COPY app.py ./

# NOTE(review): no USER instruction, so the app runs as root. Switching to a
# non-root user requires HF_HOME / UV_CACHE_DIR (under /data) to be writable by
# that user at runtime -- confirm against the deployment before changing.

# Document the port the app listens on.
EXPOSE 7860

# The command to run the FastAPI app (exec form, so uvicorn receives signals
# directly).
CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]