Update app.py
app.py
CHANGED
@@ -4,14 +4,14 @@ from transformers import AutoModelForCausalLM, AutoTokenizer, TextIteratorStreamer
 import torch
 from threading import Thread
 
-phi4_model_path = "
+phi4_model_path = "microsoft/Phi-4-reasoning-plus"
 
 device = "cuda:0" if torch.cuda.is_available() else "cpu"
 
 phi4_model = AutoModelForCausalLM.from_pretrained(phi4_model_path, device_map="auto", torch_dtype="auto")
 phi4_tokenizer = AutoTokenizer.from_pretrained(phi4_model_path)
 
-@spaces.GPU(duration=
+@spaces.GPU(duration=120)
 def generate_response(user_message, max_tokens, temperature, top_k, top_p, repetition_penalty, history_state):
     if not user_message.strip():
         return history_state, history_state
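For context on what this change touches: on a ZeroGPU Space, a `@spaces.GPU(duration=120)` decorator reserves GPU hardware for up to 120 seconds per call, and the `TextIteratorStreamer` imported in the hunk header is the standard transformers mechanism for streaming tokens out of a blocking `model.generate` call. Below is a minimal sketch of that streaming pattern, assuming `phi4_model` and `phi4_tokenizer` are loaded as in the diff; the `stream_reply` name, message structure, and sampling defaults are illustrative assumptions, not the Space's actual `generate_response` body.

# A minimal sketch of the streaming pattern, not the Space's actual code.
# Assumes phi4_model and phi4_tokenizer are already loaded as in the diff.
from threading import Thread

from transformers import TextIteratorStreamer


def stream_reply(user_message, max_tokens=1024, temperature=0.8):
    # Build a chat-formatted prompt (message structure assumed here).
    messages = [{"role": "user", "content": user_message}]
    input_ids = phi4_tokenizer.apply_chat_template(
        messages, add_generation_prompt=True, return_tensors="pt"
    ).to(phi4_model.device)

    # The streamer yields decoded text pieces as generate() produces tokens.
    streamer = TextIteratorStreamer(
        phi4_tokenizer, skip_prompt=True, skip_special_tokens=True
    )
    generation_kwargs = dict(
        input_ids=input_ids,
        max_new_tokens=max_tokens,
        temperature=temperature,
        do_sample=True,
        streamer=streamer,
    )

    # generate() blocks, so run it on a background thread and consume
    # the streamer from this one, yielding the growing reply.
    Thread(target=phi4_model.generate, kwargs=generation_kwargs).start()
    reply = ""
    for piece in streamer:
        reply += piece
        yield reply

Running `generate` on a worker thread is what lets a Gradio callback like `generate_response` yield partial strings to the UI while generation is still in progress.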