SkyNetWalker committed on
Commit
7362f63
·
verified ·
1 Parent(s): 565c016

Update run.sh

Browse files
Files changed (1) hide show
  1. run.sh +6 -11
run.sh CHANGED
@@ -4,23 +4,18 @@
4
  ollama serve &
5
 
6
  # Wait a few seconds for the server to be fully operational
7
- sleep 5
8
 
9
  # Pull the model from Hugging Face.
10
  # This command downloads the model and makes it available to the API.
11
  # It's the non-interactive version of "ollama run".
12
- ollama pull hf.co/bartowski/Qwen_Qwen3-4B-Instruct-2507-GGUF:Q4_K_M
13
  #ollama pull hf.co/bartowski/Qwen_Qwen3-4B-Thinking-2507-GGUF:Q4_K_M
14
- ollama pull smollm2:360m-instruct-q5_K_M
15
- ollama pull hf.co/bartowski/Llama-3.2-3B-Instruct-GGUF:Q4_K_M
16
  #ollama pull gemma3n:e2b-it-q4_K_M #slow on Spaces CPU
17
- ollama pull granite3.3:2b
18
- ollama pull hf.co/bartowski/tencent_Hunyuan-4B-Instruct-GGUF:Q4_K_M
19
-
20
-
21
- #---- 20250722 fail to run
22
- #ollama pull hf.co/ggml-org/SmolLM3-3B-GGUF:Q4_K_M
23
- #ollama pull hf.co/bartowski/nvidia_OpenReasoning-Nemotron-1.5B-GGUF:Q5_K_M
24
 
25
 
26
  # Start the Gradio web application
 
4
  ollama serve &
5
 
6
  # Wait a few seconds for the server to be fully operational
7
+ sleep 10
8
 
9
  # Pull the model from Hugging Face.
10
  # This command downloads the model and makes it available to the API.
11
  # It's the non-interactive version of "ollama run".
12
+ ollama pull 'hf.co/bartowski/Qwen_Qwen3-4B-Instruct-2507-GGUF:Q4_K_M'
13
  #ollama pull hf.co/bartowski/Qwen_Qwen3-4B-Thinking-2507-GGUF:Q4_K_M
14
+ ollama pull 'smollm2:360m-instruct-q5_K_M'
15
+ ollama pull 'hf.co/bartowski/Llama-3.2-3B-Instruct-GGUF:Q4_K_M'
16
  #ollama pull gemma3n:e2b-it-q4_K_M #slow on Spaces CPU
17
+ ollama pull 'granite3.3:2b'
18
+ ollama pull 'hf.co/bartowski/tencent_Hunyuan-4B-Instruct-GGUF:Q4_K_M'
 
 
 
 
 
19
 
20
 
21
  # Start the Gradio web application