File size: 549 Bytes
092a975
 
 
 
 
 
 
 
0c78dfd
faa4e2e
2da0c5f
092a975
 
 
 
8ae6c69
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
# Serves a GGUF model over HTTP on port 7860 using a prebuilt llama.cpp
# `llama-server` binary.
FROM python:3.12

# Unprivileged account (UID 1000); its home directory holds the model and the
# llama.cpp binaries, and the server runs under it.
RUN useradd -m -u 1000 app

WORKDIR /home/app

# Index refresh and install share ONE layer so a cached `apt-get update` can
# never be combined with a newer package list; the index is dropped in the
# same layer so it does not persist in the image. `unzip` is required to
# unpack the llama.cpp release archive below.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        clang \
        cmake \
        g++ \
        git \
        make \
        socat \
        unzip \
        wget \
    && rm -rf /var/lib/apt/lists/*

# Nothing below needs root; files fetched from here on are owned by `app`.
USER app

# Hugging Face serves the raw file from /resolve/<rev>/; the /blob/<rev>/ URL
# is the HTML viewer page and would be saved as a bogus model.gguf.
RUN wget --progress=dot:giga -O model.gguf \
        "https://huggingface.co/mradermacher/bellman-mistral-7b-instruct-v0.3-GGUF/resolve/main/bellman-mistral-7b-instruct-v0.3.Q5_K_M.gguf"

# `ADD <url>` does not extract remote archives, so download, unpack and delete
# the zip within a single layer. The final `test` fails the build early if the
# archive does not provide build/bin/llama-server (the path CMD relies on).
# NOTE(review): the download is not checksum-verified; add `sha256sum -c` once
# the expected digest for release b4502 is recorded.
RUN wget --progress=dot:giga -O llama.zip \
        "https://github.com/ggerganov/llama.cpp/releases/download/b4502/llama-b4502-bin-ubuntu-x64.zip" \
    && unzip -q llama.zip \
    && rm llama.zip \
    && test -x build/bin/llama-server

EXPOSE 7860

# Exec form without a shell wrapper: llama-server is PID 1 and receives
# SIGTERM from `docker stop` directly.
CMD ["/home/app/build/bin/llama-server", "-m", "/home/app/model.gguf", "-c", "8192", "--host", "0.0.0.0", "--port", "7860"]