space update

app.py CHANGED
@@ -189,6 +189,11 @@ def respond(
     max_tokens,
     temperature,
     top_p,
+    model_file,
+    model_url,
+    load_file_btn,
+    load_url_btn,
+    status_display
 ):
     """
     Generate a response using the UstaModel
@@ -234,44 +239,88 @@ def respond(
     except Exception as e:
         yield f"Sorry, I encountered an error: {str(e)}"

-# Create
-
-
-
-
-
+# Create a Blocks interface to properly handle events
+with gr.Blocks(title="🤖 Usta Model Chat", theme=gr.themes.Soft()) as demo:
+    gr.Markdown("# 🤖 Usta Model Chat")
+    gr.Markdown("Chat with a custom transformer language model built from scratch! Upload your own model file or provide a URL to load a different model.")
+
+    # Model loading section
+    with gr.Accordion("🔧 Model Loading Options", open=False):
+        with gr.Row():
+            with gr.Column():
+                gr.Markdown("### 📁 Upload Model File")
+                model_file = gr.File(label="Upload Model File (.pth)", file_types=[".pth", ".pt"])
+                load_file_btn = gr.Button("Load from File", variant="primary")
+
+            with gr.Column():
+                gr.Markdown("### 🌐 Load from URL")
+                model_url = gr.Textbox(label="Model URL", placeholder="https://github.com/malibayram/llm-from-scratch/raw/main/u_model_4000.pth")
+                load_url_btn = gr.Button("Load from URL", variant="primary")
+
+        status_display = gr.Textbox(label="Model Status", value=model_status, interactive=False)
+
+    # Chat interface (simpler version)
+    chatbot = gr.Chatbot(label="Chat", type="messages")
+    msg = gr.Textbox(label="Message", placeholder="Type your message here...")
+
+    # Generation settings
+    with gr.Accordion("⚙️ Generation Settings", open=False):
+        system_msg = gr.Textbox(
+            value="You are Usta, a geographical knowledge assistant trained from scratch.",
             label="System message"
-        )
-        gr.Slider(minimum=1, maximum=30, value=20, step=1, label="Max new tokens")
-        gr.Slider(minimum=0.1, maximum=2.0, value=1.0, step=0.1, label="Temperature")
-        gr.Slider(
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
+        )
+        max_tokens = gr.Slider(minimum=1, maximum=30, value=20, step=1, label="Max new tokens")
+        temperature = gr.Slider(minimum=0.1, maximum=2.0, value=1.0, step=0.1, label="Temperature")
+        top_p = gr.Slider(minimum=0.1, maximum=1.0, value=0.95, step=0.05, label="Top-p")
+
+    # Button controls
+    with gr.Row():
+        submit_btn = gr.Button("Send", variant="primary")
+        clear_btn = gr.Button("Clear Chat", variant="secondary")
+
+    # Event handlers
+    def chat_respond(message, history, sys_msg, max_tok, temp, top_p_val):
+        if not message.strip():
+            return history, ""
+
+        # Convert messages format for our respond function
+        tuple_history = [(h["role"], h["content"]) for h in history if h["role"] != "system"]
+
+        # Generate response using our existing function
+        response_gen = respond(
+            message, tuple_history, sys_msg, max_tok, temp, top_p_val,
+            None, None, None, None, None  # Dummy values for unused params
+        )
+
+        # Get the response
+        response = ""
+        for r in response_gen:
+            response = r
+
+        # Add to history in messages format
+        history.append({"role": "user", "content": message})
+        history.append({"role": "assistant", "content": response})
+
+        return history, ""

     # Set up event handlers
+    submit_btn.click(
+        chat_respond,
+        inputs=[msg, chatbot, system_msg, max_tokens, temperature, top_p],
+        outputs=[chatbot, msg]
+    )
+
+    msg.submit(
+        chat_respond,
+        inputs=[msg, chatbot, system_msg, max_tokens, temperature, top_p],
+        outputs=[chatbot, msg]
+    )
+
+    clear_btn.click(
+        lambda: ([], ""),
+        outputs=[chatbot, msg]
+    )
+
     load_file_btn.click(
         load_model_from_file,
         inputs=[model_file],
@@ -284,8 +333,5 @@ def setup_events():
         outputs=[status_display]
     )

-# Set up events after interface creation
-demo.load(setup_events)
-
 if __name__ == "__main__":
     demo.launch()
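A note on the new chat handler: the Chatbot is created with type="messages", so history arrives as a list of {"role": ..., "content": ...} dicts, and chat_respond flattens it to tuples before delegating to the existing respond generator. A minimal standalone sketch of that conversion (the history entries here are made up for illustration):

# Messages-format history, as gr.Chatbot(type="messages") stores it.
history = [
    {"role": "system", "content": "You are Usta, a geographical knowledge assistant."},
    {"role": "user", "content": "What is the capital of France?"},
    {"role": "assistant", "content": "Paris"},
]

# The conversion used in chat_respond: drop system entries, flatten to tuples.
tuple_history = [(h["role"], h["content"]) for h in history if h["role"] != "system"]
print(tuple_history)
# [('user', 'What is the capital of France?'), ('assistant', 'Paris')]

Worth noting: this produces (role, content) pairs, while Gradio's older tuple-style histories pair (user_message, assistant_message); whether respond expects the former depends on its body, which this diff does not show.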
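The click wiring in the diff assumes load_model_from_file (and, for load_url_btn, a URL counterpart) defined elsewhere in app.py; neither body appears in this change. A hypothetical sketch of what such handlers could look like, assuming a PyTorch .pth checkpoint and a module-level model object — every name and detail below is illustrative, not the Space's actual code:

import tempfile
import urllib.request

import torch

def load_model_from_file(model_file):
    # Hypothetical: the real load_model_from_file in app.py is not shown in this diff.
    if model_file is None:
        return "No file uploaded."
    try:
        path = getattr(model_file, "name", model_file)  # gr.File may hand back a path or a file-like object
        state_dict = torch.load(path, map_location="cpu")
        model.load_state_dict(state_dict)  # `model` assumed to be the global UstaModel instance
        model.eval()
        return f"Model loaded from {path}"
    except Exception as e:
        return f"Failed to load model: {e}"

def load_model_from_url(model_url):
    # Hypothetical counterpart wired to load_url_btn.
    if not model_url.strip():
        return "No URL provided."
    try:
        with tempfile.NamedTemporaryFile(suffix=".pth", delete=False) as tmp:
            urllib.request.urlretrieve(model_url, tmp.name)
        state_dict = torch.load(tmp.name, map_location="cpu")
        model.load_state_dict(state_dict)
        model.eval()
        return f"Model loaded from {model_url}"
    except Exception as e:
        return f"Failed to load model: {e}"

Both return a status string, which matches the outputs=[status_display] wiring in the diff.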
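One more observation: respond is a generator (it yields its output, including its error message), but chat_respond drains it and keeps only the final value, so nothing streams to the UI. If streaming were wanted, the handler could itself be a generator; a sketch under the same assumptions as the diff:

def chat_respond_streaming(message, history, sys_msg, max_tok, temp, top_p_val):
    # Illustrative streaming variant: yields partial histories so the Chatbot
    # updates as text arrives, instead of waiting for the final response.
    if not message.strip():
        yield history, ""
        return

    tuple_history = [(h["role"], h["content"]) for h in history if h["role"] != "system"]
    history = history + [
        {"role": "user", "content": message},
        {"role": "assistant", "content": ""},
    ]

    for partial in respond(message, tuple_history, sys_msg, max_tok, temp, top_p_val,
                           None, None, None, None, None):  # same dummy values as chat_respond
        history[-1]["content"] = partial
        yield history, ""

Gradio handles generator functions in click and submit events the same way as plain functions, so this could be wired in place of chat_respond without changing the inputs/outputs lists.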