# demo-llm / Dockerfile
# Petro
# 3
# 273463a
# raw
# history blame
# 421 Bytes
# Image for the demo-llm service: bundles the Zephyr-7B-beta GGUF weights and
# runs main.py's `app` under uvicorn on port 7860.
FROM python:3.9

# Download the quantized model weights at build time. -O names the output file
# explicitly; without it wget treats the bare filename as another URL to
# fetch. The file is written to the current working directory of this step
# (WORKDIR is only set further down).
RUN wget -q -O zephyr-7b-beta.Q4_K_S.gguf \
    https://huggingface.co/TheBloke/zephyr-7B-beta-GGUF/resolve/main/zephyr-7b-beta.Q4_K_S.gguf

# Install Python dependencies before copying the application code so this
# layer is reused when only main.py changes. --no-cache-dir keeps pip's
# download cache out of the layer, so no separate purge step is needed.
COPY requirements.txt ./requirements.txt
RUN python -m pip install --no-cache-dir -U pip && \
    python -m pip install --no-cache-dir -r requirements.txt

COPY ./main.py /code/main.py
WORKDIR /code

# Documents the port uvicorn listens on; EXPOSE does not publish it.
EXPOSE 7860

CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "7860"]