Update Dockerfile
Browse files- Dockerfile +19 -5
Dockerfile
CHANGED
@@ -25,10 +25,24 @@ COPY --chown=user . /app
|
|
25 |
RUN pip install --no-cache-dir \
|
26 |
torch==2.3.1+cu121 torchaudio==2.3.1 \
|
27 |
--index-url https://download.pytorch.org/whl/cu121
|
28 |
-
|
29 |
-
RUN pip install text-generation==0.6.1
|
30 |
-
ENV ORPHEUS_API_URL=http://127.0.0.1:1234/v1/completions
|
31 |
EXPOSE 7860
|
32 |
-
|
33 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
34 |
|
|
|
25 |
RUN pip install --no-cache-dir \
|
26 |
torch==2.3.1+cu121 torchaudio==2.3.1 \
|
27 |
--index-url https://download.pytorch.org/whl/cu121
|
28 |
+
|
|
|
|
|
29 |
EXPOSE 7860
|
30 |
+
|
31 |
+
RUN pip install --no-cache-dir text-generation==0.6.1
|
32 |
+
|
33 |
+
ENV HF_HOME=/app/.cache
|
34 |
+
ENV MODEL_ID="SebastianBodza/Kartoffel_Orpheus-3B_german_natural-v0.1"
|
35 |
+
ENV ORPHEUS_API_URL=http://127.0.0.1:1234/v1/completions
|
36 |
+
# Model name that ends up in the JSON payload sent by OrpheusEngine (per the
# original inline note). The note lives on its own line because Dockerfile
# comments are only recognized at the start of a line; a trailing "# ..." after
# the value would be parsed as extra ENV arguments and break the build.
ENV ORPHEUS_MODEL=$MODEL_ID
|
37 |
+
|
38 |
+
# Container start command: a single bash -c invocation that
#   1. starts text-generation-launcher in the background (`&`) on port 1234,
#      the same port ORPHEUS_API_URL points at, and
#   2. runs uvicorn in the foreground, serving app:app on 0.0.0.0:7860
#      (the EXPOSEd port).
# $MODEL_ID is expanded by the shell at container start from the ENV above.
# NOTE(review): --quantization, --enable-chunked-prefill and
#   --gpu-memory-utilization look like vLLM-style options rather than
#   text-generation-launcher options — confirm against the launcher's CLI help.
# NOTE(review): the pip package `text-generation` is presumably only a client
#   library; verify that the text-generation-launcher binary actually exists
#   in the image.
# NOTE(review): the backgrounded launcher is not supervised; if it exits, the
#   container keeps running uvicorn alone. Consider an init/supervisor.
CMD bash -c "\
|
39 |
+
text-generation-launcher \
|
40 |
+
--model-id $MODEL_ID \
|
41 |
+
--port 1234 \
|
42 |
+
--max-input-length 4096 \
|
43 |
+
--dtype auto \
|
44 |
+
--quantization fp8 \
|
45 |
+
--enable-chunked-prefill \
|
46 |
+
--gpu-memory-utilization 0.7 & \
|
47 |
+
uvicorn app:app --host 0.0.0.0 --port 7860"
|
48 |
|