Update Dockerfile
Browse files- Dockerfile +7 -8
Dockerfile
CHANGED
@@ -50,12 +50,11 @@ ENV ORPHEUS_API_URL=http://127.0.0.1:1234/v1/completions
|
|
50 |
|
51 |
# ───── Entrypoint ────────────────────────────────────────
|
52 |
CMD bash -c "\
|
53 |
-
|
54 |
-
|
55 |
-
|
56 |
-
|
57 |
-
|
58 |
-
|
59 |
-
|
60 |
-
|
61 |
|
|
|
50 |
|
51 |
# ───── Entrypoint ────────────────────────────────────────
|
52 |
CMD bash -c "\
|
53 |
+
python -m vllm.entrypoints.openai.api_server \
|
54 |
+
--model ${MODEL_ID} \
|
55 |
+
--port 1234 \
|
56 |
+
--dtype bfloat16 \
|
57 |
+
--gpu-memory-utilization 0.9 \
|
58 |
+
--max-model-len 8192 & # ← im Hintergrund starten
|
59 |
+
exec uvicorn app:app --host 0.0.0.0 --port 7860"
|
|
|
60 |
|