Spaces:

SkyNetWalker
/

chatCPU

Running

SkyNetWalker committed on Jun 26

Commit

105d6cf

verified ·

1 Parent(s): 3087f19

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -101,8 +101,8 @@ with gr.Blocks(theme=gr.themes.Default(primary_hue="blue", secondary_hue="neutra
         """
         #Disable Qwen3 thinking
-        #if "Qwen3".lower() in current_selected_model:
-        #    system_prompt = system_prompt+" /no_think"
         # The 'history' variable from Gradio contains the entire conversation.
         # We prepend the system prompt to this history to form the final payload.
@@ -116,8 +116,7 @@ with gr.Blocks(theme=gr.themes.Default(primary_hue="blue", secondary_hue="neutra
         response_stream = ollama.chat(
             model=current_selected_model, # Use the dynamically selected model
             messages=messages,
-            stream=True,
-            think=False
         )
         # Iterate through the stream, updating the placeholder with each new chunk.

         """
         #Disable Qwen3 thinking
+        if "Qwen3".lower() in current_selected_model:
+            system_prompt = system_prompt+" /no_think"
         # The 'history' variable from Gradio contains the entire conversation.
         # We prepend the system prompt to this history to form the final payload.
         response_stream = ollama.chat(
             model=current_selected_model, # Use the dynamically selected model
             messages=messages,
+            stream=True
         )
         # Iterate through the stream, updating the placeholder with each new chunk.