Spaces:
Running
Running
Update run.sh
Browse files
run.sh
CHANGED
@@ -4,23 +4,18 @@
|
|
4 |
ollama serve &
|
5 |
|
6 |
# Wait a few seconds for the server to be fully operational
|
7 |
-
sleep
|
8 |
|
9 |
# Pull the model from Hugging Face.
|
10 |
# This command downloads the model and makes it available to the API.
|
11 |
# It's the non-interactive version of "ollama run".
|
12 |
-
ollama pull hf.co/bartowski/Qwen_Qwen3-4B-Instruct-2507-GGUF:Q4_K_M
|
13 |
#ollama pull hf.co/bartowski/Qwen_Qwen3-4B-Thinking-2507-GGUF:Q4_K_M
|
14 |
-
ollama pull smollm2:360m-instruct-q5_K_M
|
15 |
-
ollama pull hf.co/bartowski/Llama-3.2-3B-Instruct-GGUF:Q4_K_M
|
16 |
#ollama pull gemma3n:e2b-it-q4_K_M #slow on Spaces CPU
|
17 |
-
ollama pull granite3.3:2b
|
18 |
-
ollama pull hf.co/bartowski/tencent_Hunyuan-4B-Instruct-GGUF:Q4_K_M
|
19 |
-
|
20 |
-
|
21 |
-
#---- 20250722: failed to run
|
22 |
-
#ollama pull hf.co/ggml-org/SmolLM3-3B-GGUF:Q4_K_M
|
23 |
-
#ollama pull hf.co/bartowski/nvidia_OpenReasoning-Nemotron-1.5B-GGUF:Q5_K_M
|
24 |
|
25 |
|
26 |
# Start the Gradio web application
|
|
|
4 |
ollama serve &
|
5 |
|
6 |
# Wait a few seconds for the server to be fully operational
|
7 |
+
sleep 10
|
8 |
|
9 |
# Pull the model from Hugging Face.
|
10 |
# This command downloads the model and makes it available to the API.
|
11 |
# It's the non-interactive version of "ollama run".
|
12 |
+
ollama pull 'hf.co/bartowski/Qwen_Qwen3-4B-Instruct-2507-GGUF:Q4_K_M'
|
13 |
#ollama pull hf.co/bartowski/Qwen_Qwen3-4B-Thinking-2507-GGUF:Q4_K_M
|
14 |
+
ollama pull 'smollm2:360m-instruct-q5_K_M'
|
15 |
+
ollama pull 'hf.co/bartowski/Llama-3.2-3B-Instruct-GGUF:Q4_K_M'
|
16 |
#ollama pull gemma3n:e2b-it-q4_K_M #slow on Spaces CPU
|
17 |
+
ollama pull 'granite3.3:2b'
|
18 |
+
ollama pull 'hf.co/bartowski/tencent_Hunyuan-4B-Instruct-GGUF:Q4_K_M'
|
|
|
|
|
|
|
|
|
|
|
19 |
|
20 |
|
21 |
# Start the Gradio web application
|