Spaces:

lemonteaa
/

edge_llm_chat

Running

edge_llm_chat / config.yaml

Create config.yaml

f7ba720 verified 11 days ago

790 Bytes

	macros:
	"latest-llama": >
	/app/llama.cpp/build/bin/llama-server
	--port ${PORT}
	--no-mmap
	--threads 2

	models:
	"Ernie-4.5-0.3B":
	cmd: \|
	${latest-llama}
	-m /app/llama.cpp/build/ERNIE-4.5-0.3B-PT-UD-Q8_K_XL.gguf
	-c 32000
	--jinja
	ttl: 360
	"LFM2-VL-450M":
	cmd: \|
	${latest-llama}
	-m /app/llama.cpp/build/LFM2-VL-450M-Q8_0.gguf
	--mmproj /app/llama.cpp/build/mmproj-LFM2-VL-450M-F16.gguf
	-c 32000
	ttl: 360
	"gemma-3-270m-it":
	cmd: \|
	${latest-llama}
	-m /app/llama.cpp/build/gemma-3-270m-it-UD-Q8_K_XL.gguf
	-c 32000
	--jinja
	ttl: 360
	"Qwen3-0.6B":
	cmd: \|
	${latest-llama}
	-m /app/llama.cpp/build/Qwen3-0.6B-UD-Q8_K_XL.gguf
	-c 32000
	--jinja
	ttl: 360