Spaces:
Running
Running
# Reusable command fragments. A macro is expanded wherever a model command
# references it by name, e.g. ${latest-llama}.
#
# NOTE(review): ${PORT} is not defined anywhere in this file; presumably it is
# substituted by the proxy that launches llama-server (llama-swap style) — confirm.
macros:
  # Folded scalar (>): the line breaks below are folded into spaces, so the
  # macro expands to a single command line. It starts llama-server with
  # memory-mapping of the model file disabled (--no-mmap) and 2 threads.
  "latest-llama": >
    /app/llama.cpp/build/bin/llama-server
    --port ${PORT}
    --no-mmap
    --threads 2
# Model registry: each key is the model name, `cmd` is the command used to
# start a server for it, and `ttl` is an idle timeout.
#
# Every `cmd` begins with ${latest-llama}, which refers to the macro of that
# name, then adds the model file (-m), a context size of 32000 tokens (-c) and,
# for most entries, --jinja.
#
# NOTE(review): ttl is presumably in seconds (unload after 360 s without
# requests), as in llama-swap — confirm against the launcher's documentation.
models:
  "Ernie-4.5-0.3B":
    cmd: |
      ${latest-llama}
      -m /app/llama.cpp/build/ERNIE-4.5-0.3B-PT-UD-Q8_K_XL.gguf
      -c 32000
      --jinja
    ttl: 360

  # Vision-language model: --mmproj supplies the multimodal projector file
  # alongside the main GGUF.
  # NOTE(review): unlike the other entries this one does not pass --jinja;
  # confirm that is intentional.
  "LFM2-VL-450M":
    cmd: |
      ${latest-llama}
      -m /app/llama.cpp/build/LFM2-VL-450M-Q8_0.gguf
      --mmproj /app/llama.cpp/build/mmproj-LFM2-VL-450M-F16.gguf
      -c 32000
    ttl: 360

  "gemma-3-270m-it":
    cmd: |
      ${latest-llama}
      -m /app/llama.cpp/build/gemma-3-270m-it-UD-Q8_K_XL.gguf
      -c 32000
      --jinja
    ttl: 360

  "Qwen3-0.6B":
    cmd: |
      ${latest-llama}
      -m /app/llama.cpp/build/Qwen3-0.6B-UD-Q8_K_XL.gguf
      -c 32000
      --jinja
    ttl: 360