Update app.py
app.py CHANGED
@@ -5,14 +5,14 @@ import torch
 from threading import Thread
 import re
 
-phi4_model_path = "
+phi4_model_path = "Daemontatox/Qwen3-14B-Griffon"
 
 device = "cuda:0" if torch.cuda.is_available() else "cpu"
 
 phi4_model = AutoModelForCausalLM.from_pretrained(phi4_model_path, device_map="auto", torch_dtype="auto")
 phi4_tokenizer = AutoTokenizer.from_pretrained(phi4_model_path)
 
-@spaces.GPU(duration=
+@spaces.GPU(duration=60)
 def generate_response(user_message, max_tokens, temperature, top_k, top_p, repetition_penalty, history_state):
     if not user_message.strip():
         return history_state, history_state
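The commit swaps the checkpoint to Daemontatox/Qwen3-14B-Griffon and pins the GPU allocation: on Hugging Face Spaces, @spaces.GPU(duration=60) requests ZeroGPU hardware for up to 60 seconds per call to the decorated function.

The hunk cuts off right after the empty-input guard, so the rest of generate_response is not shown. Given the "from threading import Thread" import, the body most likely streams tokens from a background generation thread. Below is a minimal sketch of that pattern, assuming transformers' TextIteratorStreamer and the phi4_model / phi4_tokenizer globals from the hunk above; the helper name stream_reply and the chat-message format are illustrative, not the Space's actual code.

    # Sketch only: one plausible streaming continuation for generate_response.
    # Assumes the phi4_model / phi4_tokenizer globals defined in the diff above.
    from threading import Thread
    from transformers import TextIteratorStreamer

    def stream_reply(user_message, max_tokens, temperature, top_k, top_p,
                     repetition_penalty, history_state):
        # Fold the new user turn into the chat history and render it as a prompt.
        messages = history_state + [{"role": "user", "content": user_message}]
        input_ids = phi4_tokenizer.apply_chat_template(
            messages, add_generation_prompt=True, return_tensors="pt"
        ).to(phi4_model.device)

        # Run generate() on a background thread; the streamer yields decoded
        # text chunks as they are produced, so the UI can update incrementally.
        streamer = TextIteratorStreamer(
            phi4_tokenizer, skip_prompt=True, skip_special_tokens=True
        )
        Thread(target=phi4_model.generate, kwargs=dict(
            input_ids=input_ids,
            max_new_tokens=max_tokens,
            do_sample=True,
            temperature=temperature,
            top_k=top_k,
            top_p=top_p,
            repetition_penalty=repetition_penalty,
            streamer=streamer,
        )).start()

        # Accumulate chunks and yield (chatbot, state) pairs as they arrive,
        # mirroring the two-value shape of the guard's early return.
        assistant_text = ""
        for chunk in streamer:
            assistant_text += chunk
            updated = messages + [{"role": "assistant", "content": assistant_text}]
            yield updated, updated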