Tomtom84 committed on
Commit
8fc2ed8
·
verified ·
1 Parent(s): 56c49c7

Update Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +19 -5
Dockerfile CHANGED
@@ -25,10 +25,24 @@ COPY --chown=user . /app
25
  RUN pip install --no-cache-dir \
26
  torch==2.3.1+cu121 torchaudio==2.3.1 \
27
  --index-url https://download.pytorch.org/whl/cu121
28
-
29
- RUN pip install text-generation==0.6.1
30
- ENV ORPHEUS_API_URL=http://127.0.0.1:1234/v1/completions
31
  EXPOSE 7860
32
- CMD bash -c "text-generation-launcher --model-id SebastianBodza/Kartoffel_Orpheus-3B_german_natural-v0.1 --port 1234 & \
33
- uvicorn app:app --host 0.0.0.0 --port 7860"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
34
 
 
25
  RUN pip install --no-cache-dir \
26
  torch==2.3.1+cu121 torchaudio==2.3.1 \
27
  --index-url https://download.pytorch.org/whl/cu121
28
+
 
 
29
  EXPOSE 7860
30
+
31
+ RUN pip install --no-cache-dir text-generation==0.6.1
32
+
33
+ ENV HF_HOME=/app/.cache
34
+ ENV MODEL_ID="SebastianBodza/Kartoffel_Orpheus-3B_german_natural-v0.1"
35
+ ENV ORPHEUS_API_URL=http://127.0.0.1:1234/v1/completions
36
+ ENV ORPHEUS_MODEL=$MODEL_ID # landet im JSON-Payload von OrpheusEngine
37
+
38
+ CMD bash -c "\
39
+ text-generation-launcher \
40
+ --model-id $MODEL_ID \
41
+ --port 1234 \
42
+ --max-input-length 4096 \
43
+ --dtype auto \
44
+ --quantization fp8 \
45
+ --enable-chunked-prefill \
46
+ --gpu-memory-utilization 0.7 & \
47
+ uvicorn app:app --host 0.0.0.0 --port 7860"
48