Spaces: KoboldAI/Koboldcpp-Tiefighter

Running on T4

concedo committed on Jun 6, 2024

Commit

1c97e32

verified ·

1 Parent(s): 541084a

Add whisper launch args

Files changed (1) hide show

Dockerfile CHANGED Viewed

@@ -1,6 +1,7 @@
 FROM nvidia/cuda:12.1.1-devel-ubuntu22.04
 ARG MODEL
 ARG IMGMODEL
 ARG MMPROJ
 ARG MODEL_NAME
 ARG ADDITIONAL
@@ -13,5 +14,6 @@ RUN make -j$(nproc) LLAMA_OPENBLAS=1 LLAMA_CUBLAS=1 LLAMA_PORTABLE=1 LLAMA_COLAB
 RUN wget -O model.ggml $MODEL || true
 RUN wget -O imgmodel.ggml $IMGMODEL || true
 RUN wget -O mmproj.ggml $MMPROJ || true
-CMD /bin/python3 ./koboldcpp.py --model model.ggml --sdmodel imgmodel.ggml --sdthreads 4 --sdquant --sdclamped --mmproj mmproj.ggml $ADDITIONAL --port 7860 --hordeconfig $MODEL_NAME 1 1 --preloadstory default.json --ignoremissing

 FROM nvidia/cuda:12.1.1-devel-ubuntu22.04
 ARG MODEL
 ARG IMGMODEL
+ARG WHISPERMODEL
 ARG MMPROJ
 ARG MODEL_NAME
 ARG ADDITIONAL
 RUN wget -O model.ggml $MODEL || true
 RUN wget -O imgmodel.ggml $IMGMODEL || true
 RUN wget -O mmproj.ggml $MMPROJ || true
+RUN wget -O whispermodel.ggml $WHISPERMODEL || true
+CMD /bin/python3 ./koboldcpp.py --model model.ggml --whispermodel whispermodel.ggml --sdmodel imgmodel.ggml --sdthreads 4 --sdquant --sdclamped --mmproj mmproj.ggml $ADDITIONAL --port 7860 --hordemodelname $MODEL_NAME --hordemaxctx 1 --hordegenlen 1 --preloadstory default.json --ignoremissing