|
FROM nvidia/cuda:12.8.1-base-ubuntu22.04 AS base |
|
|
|
ARG DEBIAN_FRONTEND=noninteractive |
|
|
|
RUN apt-get update && apt-get install -y \ |
|
python3.10 python3-pip openmpi-bin libopenmpi-dev git git-lfs wget \ |
|
&& apt install python-is-python3 \ |
|
&& pip install --upgrade pip setuptools \ |
|
&& rm -rf /var/lib/apt/lists/* |
|
|
|
FROM base AS devel |
|
RUN pip install --no-cache-dir -U tensorrt_llm==0.18.2 --extra-index-url https://pypi.nvidia.com |
|
WORKDIR /app |
|
RUN git clone -b v0.18.2 https://github.com/NVIDIA/TensorRT-LLM.git \ |
|
&& mv TensorRT-LLM/examples ./TensorRT-LLM-examples \ |
|
&& rm -rf TensorRT-LLM |
|
|
|
FROM devel AS release |
|
WORKDIR /app |
|
COPY assets/ ./assets |
|
RUN wget -nc -P assets/ https://raw.githubusercontent.com/openai/whisper/main/whisper/assets/mel_filters.npz |
|
|
|
COPY scripts/setup.sh ./ |
|
RUN apt update && bash setup.sh && rm setup.sh |
|
|
|
COPY requirements/server.txt . |
|
RUN pip install --no-cache-dir -r server.txt && rm server.txt |
|
COPY whisper_live ./whisper_live |
|
COPY scripts/build_whisper_tensorrt.sh . |
|
COPY run_server.py . |