Spaces:

rapacious
/

LLaMA_Server

Paused

rapacious committed on Mar 8

Commit

54dbd2f

verified ·

1 Parent(s): 0aa159f

Update Dockerfile

Files changed (1) hide show

Dockerfile CHANGED Viewed

@@ -1,21 +1,23 @@
-# Choose the base image (one with CUDA if a GPU is needed)
 FROM ubuntu:22.04
-# Install the required libraries
 RUN apt-get update && apt-get install -y \
     unzip wget curl python3 python3-pip
-# Copy the pre-built binary file into the container
 COPY llama_bin.zip /app/llama_bin.zip
 WORKDIR /app
 # Extract the binaries
 RUN unzip llama_bin.zip && rm llama_bin.zip && chmod +x bin/server
-# Copy the model (or download it if needed)
-COPY models /models
-# Or download it if the model is not present yet
-# RUN wget -O /models/llama-7b.gguf https://huggingface.co/TheBloke/Llama-2-7B-GGUF/resolve/main/llama-2-7b.Q4_K_M.gguf
-# Run the server
-CMD ["./bin/server", "-m", "/models/llama-7b.gguf", "-p", "8000"]

+# Base image: plain Ubuntu 22.04.
 FROM ubuntu:22.04
+# Install the tools used by the build steps below (unzip, wget) plus the
+# other packages from the original install list.
+# ca-certificates is listed explicitly: with --no-install-recommends it is no
+# longer pulled in implicitly, and the HTTPS model download would then fail
+# certificate verification.
+# The apt package lists are deleted in the same layer so they never end up
+# in the image.
+# NOTE(review): nothing in this Dockerfile uses curl, python3 or python3-pip;
+# confirm whether the bundled binaries need them before dropping them.
+RUN apt-get update && apt-get install -y --no-install-recommends \
+        ca-certificates \
+        curl \
+        python3 \
+        python3-pip \
+        unzip \
+        wget \
+    && rm -rf /var/lib/apt/lists/*
+# Unprivileged account so the server does not run as root. UID 1000 follows
+# the Hugging Face Docker Spaces convention.
+RUN useradd --create-home --uid 1000 user
+# Copy the pre-built LLaMA binaries archive into the container.
 COPY llama_bin.zip /app/llama_bin.zip
 WORKDIR /app
+# Extract the binaries, delete the archive, make the server executable and
+# hand /app to the runtime user (done in the same layer that creates the
+# files, so ownership changes do not duplicate them in a second layer).
+RUN unzip llama_bin.zip && rm llama_bin.zip && chmod +x bin/server \
+    && chown -R user:user /app
+# Create /models and download the Qwen2.5-0.5B-Instruct GGUF model into it in
+# a single layer. --progress=dot:giga keeps the build log from being flooded
+# by the progress bar.
+# NOTE(review): "resolve/main" tracks a mutable branch; pin a revision and
+# verify a checksum if reproducible builds matter.
+RUN mkdir -p /models \
+    && wget --progress=dot:giga \
+        -O /models/qwen2.5-0.5b-instruct-q5_k_m.gguf \
+        https://huggingface.co/Qwen/Qwen2.5-0.5B-Instruct-GGUF/resolve/main/qwen2.5-0.5b-instruct-q5_k_m.gguf
+# Documentation only: 8000 is the value handed to the server's -p flag in
+# CMD, presumably its listen port.
+EXPOSE 8000
+# Drop root privileges for the running container.
+USER user
+# Start the server with the Qwen model.
+# NOTE(review): upstream llama.cpp's server documents --port / --host rather
+# than -p, and Docker Spaces route traffic to app_port (7860 unless
+# overridden in the Space README) — confirm this build accepts "-p" as the
+# port and listens on a reachable address.
+CMD ["./bin/server", "-m", "/models/qwen2.5-0.5b-instruct-q5_k_m.gguf", "-p", "8000"]