Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -9,17 +9,11 @@ import ollama
|
|
9 |
|
10 |
# List of available models for selection.
|
11 |
# IMPORTANT: These names must correspond to models that have been either
|
12 |
-
# 'ollama create'd from a Modelfile or 'ollama pull'ed within your Hugging Face Space.
|
13 |
-
#ollama pull hf.co/unsloth/gemma-3-4b-it-qat-GGUF:Q4_K_M
|
14 |
-
#ollama pull hf.co/Menlo/Jan-nano-128k-gguf:Q4_K_M
|
15 |
-
#ollama pull hf.co/bartowski/Qwen_Qwen3-4B-GGUF:Q4_K_M
|
16 |
-
#ollama pull hf.co/bartowski/Qwen_Qwen3-1.7B-GGUF:Q5_K_M
|
17 |
-
#ollama pull hf.co/bartowski/Llama-3.2-3B-Instruct-GGUF:Q4_K_M
|
18 |
-
|
19 |
|
20 |
# Model from run.sh
|
21 |
AVAILABLE_MODELS = [
|
22 |
'smollm2:360m-instruct-q5_K_M',
|
|
|
23 |
'hf.co/bartowski/Llama-3.2-3B-Instruct-GGUF:Q4_K_M', # OK speed with CPU
|
24 |
'hf.co/unsloth/gemma-3-4b-it-qat-GGUF:Q4_K_M', #Slow.
|
25 |
'hf.co/bartowski/Qwen_Qwen3-1.7B-GGUF:Q5_K_M',
|
@@ -40,7 +34,7 @@ with gr.Blocks(theme=gr.themes.Default(primary_hue="blue", secondary_hue="neutra
|
|
40 |
with gr.Row():
|
41 |
selected_model = gr.Radio(
|
42 |
choices=AVAILABLE_MODELS,
|
43 |
-
value=AVAILABLE_MODELS[
|
44 |
label="Select Model",
|
45 |
info="Choose the LLM model to chat with.",
|
46 |
interactive=True
|
|
|
9 |
|
10 |
# List of available models for selection.
|
11 |
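# IMPORTANT: These names must correspond to models that have been either created with 'ollama create' from a Modelfile or fetched with 'ollama pull' within your Hugging Face Space.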
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
12 |
|
13 |
# Model from run.sh
|
14 |
AVAILABLE_MODELS = [
|
15 |
'smollm2:360m-instruct-q5_K_M',
|
16 |
+
'hf.co/unsloth/LFM2-1.2B-GGUF:Q5_K_M',
|
17 |
'hf.co/bartowski/Llama-3.2-3B-Instruct-GGUF:Q4_K_M', # OK speed with CPU
|
18 |
'hf.co/unsloth/gemma-3-4b-it-qat-GGUF:Q4_K_M', #Slow.
|
19 |
'hf.co/bartowski/Qwen_Qwen3-1.7B-GGUF:Q5_K_M',
|
|
|
34 |
with gr.Row():
|
35 |
selected_model = gr.Radio(
|
36 |
choices=AVAILABLE_MODELS,
|
37 |
+
value=AVAILABLE_MODELS[1], # Default to the second model in the list (hf.co/unsloth/LFM2-1.2B-GGUF:Q5_K_M)
|
38 |
label="Select Model",
|
39 |
info="Choose the LLM model to chat with.",
|
40 |
interactive=True
|