Spaces:
Running
Running
File size: 790 Bytes
f7ba720 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 |
# Reusable command fragments. A model's `cmd` pulls one in by writing
# ${<macro-name>}, e.g. ${latest-llama}.
macros:
  # Base llama-server invocation shared by the model entries in this file.
  # `>` folds the indented lines below into one space-separated line.
  # ${PORT} is left as a placeholder; presumably the consuming tool fills
  # it in per model - TODO confirm.
  "latest-llama": >
    /app/llama.cpp/build/bin/llama-server
    --port ${PORT}
    --no-mmap
    --threads 2
# One entry per served model, keyed by model name. Each entry has a `cmd`
# (launch command) and a `ttl`.
# NOTE(review): the macros/models/cmd/ttl layout looks like a llama-swap
# config - confirm against the consuming tool.
# NOTE(review): `ttl` is presumably the idle time in seconds before the
# model is unloaded - confirm the unit in the consumer's documentation.
models:
  "Ernie-4.5-0.3B":
    # `|` keeps one argument group per line; ${latest-llama} refers to the
    # macro of that name under `macros`.
    cmd: |
      ${latest-llama}
      -m /app/llama.cpp/build/ERNIE-4.5-0.3B-PT-UD-Q8_K_XL.gguf
      -c 32000
      --jinja
    ttl: 360

  # Passes a separate --mmproj file next to the model weights; unlike the
  # other entries, no --jinja flag is given here.
  "LFM2-VL-450M":
    cmd: |
      ${latest-llama}
      -m /app/llama.cpp/build/LFM2-VL-450M-Q8_0.gguf
      --mmproj /app/llama.cpp/build/mmproj-LFM2-VL-450M-F16.gguf
      -c 32000
    ttl: 360

  "gemma-3-270m-it":
    cmd: |
      ${latest-llama}
      -m /app/llama.cpp/build/gemma-3-270m-it-UD-Q8_K_XL.gguf
      -c 32000
      --jinja
    ttl: 360

  "Qwen3-0.6B":
    cmd: |
      ${latest-llama}
      -m /app/llama.cpp/build/Qwen3-0.6B-UD-Q8_K_XL.gguf
      -c 32000
      --jinja
    ttl: 360
|