Update app.py
app.py CHANGED
@@ -100,6 +100,10 @@ with gr.Blocks(theme=gr.themes.Default(primary_hue="blue", secondary_hue="neutra
     and streams the response back to the chatbot.
     """
 
+    #Disable Qwen3 thinking
+    #if "Qwen3".lower() in current_selected_model:
+    #    system_prompt = system_prompt+" /no_think"
+
     # The 'history' variable from Gradio contains the entire conversation.
     # We prepend the system prompt to this history to form the final payload.
     messages = [{"role": "system", "content": system_prompt}] + history
@@ -112,7 +116,8 @@ with gr.Blocks(theme=gr.themes.Default(primary_hue="blue", secondary_hue="neutra
     response_stream = ollama.chat(
         model=current_selected_model,  # Use the dynamically selected model
         messages=messages,
-        stream=True
+        stream=True,
+        think=False
     )
 
     # Iterate through the stream, updating the placeholder with each new chunk.
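
For context, here is a minimal standalone sketch of the updated call, run outside the Gradio app. It assumes a local Ollama server with a Qwen3 model already pulled and an ollama Python client recent enough to support the think parameter (0.5.0 or later); the model tag, prompt, and history values are placeholders for illustration.

# Minimal sketch of the updated call, run outside the Gradio app.
# Assumptions: a local Ollama server, a Qwen3 model already pulled,
# and ollama-python >= 0.5.0 (the release that added the think flag).
import ollama

current_selected_model = "qwen3:8b"  # placeholder tag for illustration
system_prompt = "You are a helpful assistant."
history = [{"role": "user", "content": "Hello!"}]  # Gradio-style message history

# Prepend the system prompt to the running conversation, as in the app.
messages = [{"role": "system", "content": system_prompt}] + history

response_stream = ollama.chat(
    model=current_selected_model,
    messages=messages,
    stream=True,   # yields partial responses as they are generated
    think=False,   # suppress the thinking trace on reasoning models such as Qwen3
)

# Each chunk carries the next piece of the assistant's reply.
reply = ""
for chunk in response_stream:
    piece = chunk["message"]["content"]
    reply += piece
    print(piece, end="", flush=True)

The commit keeps the earlier prompt-level workaround (appending " /no_think" to the system prompt) commented out rather than deleting it. Note that, as written, that check compares the lowercased literal "qwen3" against the raw model name, so it would only match tags that are already lowercase; checking against current_selected_model.lower() would match regardless of casing.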