alibayram committed
Commit 39dfa2d · 1 Parent(s): 0eefbc1

space update

Files changed (1)
  1. app.py +45 -92
app.py CHANGED
@@ -182,30 +182,12 @@ def load_model_from_file(uploaded_file):
         model_status = error_msg
         return error_msg
 
-def respond(
-    message,
-    history: list[tuple[str, str]],
-    system_message,
-    max_tokens,
-    temperature,
-    top_p,
-    model_file,
-    model_url,
-    load_file_btn,
-    load_url_btn,
-    status_display
-):
-    """
-    Generate a response using the UstaModel
-    """
+def chat_with_usta(message, history, max_tokens=20):
+    """Simple chat function"""
     if model is None or tokenizer is None:
-        yield "Sorry, the UstaModel is not available. Please try again later."
-        return
+        return history + [["Error", "UstaModel is not available. Please try again later."]]
 
     try:
-        # For UstaModel, we'll use the message directly (ignoring system_message for now)
-        # since it's a simpler model focused on geographical knowledge
-
         # Encode the input message
         tokens = tokenizer.encode(message)
 
@@ -215,7 +197,6 @@ def respond(
 
         # Generate response
         with torch.no_grad():
-            # Use max_tokens parameter, but cap it at reasonable limit for this model
             actual_max_tokens = min(max_tokens, 32 - len(tokens))
             generated_tokens = model.generate(tokens, actual_max_tokens)
 
@@ -233,104 +214,76 @@ def respond(
         if not response:
             response = "I'm not sure how to respond to that with my geographical knowledge."
 
-        # Yield the response (to maintain compatibility with streaming interface)
-        yield response
+        # Add to history
+        history.append([message, response])
+        return history
 
     except Exception as e:
-        yield f"Sorry, I encountered an error: {str(e)}"
+        history.append([message, f"Sorry, I encountered an error: {str(e)}"])
+        return history
 
-# Create a Blocks interface to properly handle events
-with gr.Blocks(title="🤖 Usta Model Chat", theme=gr.themes.Soft()) as demo:
+# Create simple interface
+with gr.Blocks(title="🤖 Usta Model Chat") as demo:
     gr.Markdown("# 🤖 Usta Model Chat")
-    gr.Markdown("Chat with a custom transformer language model built from scratch! Upload your own model file or provide a URL to load a different model.")
+    gr.Markdown("Chat with a custom transformer language model built from scratch! This model specializes in geographical knowledge.")
 
-    # Model loading section
-    with gr.Accordion("🔧 Model Loading Options", open=False):
-        with gr.Row():
-            with gr.Column():
-                gr.Markdown("### 📁 Upload Model File")
-                model_file = gr.File(label="Upload Model File (.pth)", file_types=[".pth", ".pt"])
-                load_file_btn = gr.Button("Load from File", variant="primary")
-
-            with gr.Column():
-                gr.Markdown("### 🔗 Load from URL")
-                model_url = gr.Textbox(label="Model URL", placeholder="https://github.com/malibayram/llm-from-scratch/raw/main/u_model_4000.pth")
-                load_url_btn = gr.Button("Load from URL", variant="primary")
-
-        status_display = gr.Textbox(label="Model Status", value=model_status, interactive=False)
+    # Simple chat interface
+    chatbot = gr.Chatbot(height=400)
+    msg = gr.Textbox(label="Your message", placeholder="Ask about countries, capitals, or cities...")
 
-    # Chat interface (simpler version)
-    chatbot = gr.Chatbot(label="Chat", type="messages")
-    msg = gr.Textbox(label="Message", placeholder="Type your message here...")
+    with gr.Row():
+        send_btn = gr.Button("Send", variant="primary")
+        clear_btn = gr.Button("Clear")
 
     # Generation settings
-    with gr.Accordion("⚙️ Generation Settings", open=False):
-        system_msg = gr.Textbox(
-            value="You are Usta, a geographical knowledge assistant trained from scratch.",
-            label="System message"
+    max_tokens = gr.Slider(minimum=1, maximum=30, value=20, step=1, label="Max tokens")
+
+    # Model loading (simplified)
+    gr.Markdown("## 🔧 Load Custom Model (Optional)")
+    with gr.Row():
+        model_url = gr.Textbox(
+            label="Model URL",
+            placeholder="https://github.com/malibayram/llm-from-scratch/raw/main/u_model_4000.pth",
+            scale=3
         )
-        max_tokens = gr.Slider(minimum=1, maximum=30, value=20, step=1, label="Max new tokens")
-        temperature = gr.Slider(minimum=0.1, maximum=2.0, value=1.0, step=0.1, label="Temperature")
-        top_p = gr.Slider(minimum=0.1, maximum=1.0, value=0.95, step=0.05, label="Top-p")
+        load_url_btn = gr.Button("Load from URL", scale=1)
 
-    # Button controls
     with gr.Row():
-        submit_btn = gr.Button("Send", variant="primary")
-        clear_btn = gr.Button("Clear Chat", variant="secondary")
+        model_file = gr.File(label="Upload .pth file", file_types=[".pth"])
+        load_file_btn = gr.Button("Load File", scale=1)
+
+    status = gr.Textbox(label="Status", value=model_status, interactive=False)
 
     # Event handlers
-    def chat_respond(message, history, sys_msg, max_tok, temp, top_p_val):
+    def send_message(message, history, max_tok):
        if not message.strip():
            return history, ""
-
-        # Convert messages format for our respond function
-        tuple_history = [(h["role"], h["content"]) for h in history if h["role"] != "system"]
-
-        # Generate response using our existing function
-        response_gen = respond(
-            message, tuple_history, sys_msg, max_tok, temp, top_p_val,
-            None, None, None, None, None # Dummy values for unused params
-        )
-
-        # Get the response
-        response = ""
-        for r in response_gen:
-            response = r
-
-        # Add to history in messages format
-        history.append({"role": "user", "content": message})
-        history.append({"role": "assistant", "content": response})
-
-        return history, ""
+        return chat_with_usta(message, history, max_tok), ""
 
-    # Set up event handlers
-    submit_btn.click(
-        chat_respond,
-        inputs=[msg, chatbot, system_msg, max_tokens, temperature, top_p],
+    send_btn.click(
+        send_message,
+        inputs=[msg, chatbot, max_tokens],
         outputs=[chatbot, msg]
     )
 
     msg.submit(
-        chat_respond,
-        inputs=[msg, chatbot, system_msg, max_tokens, temperature, top_p],
+        send_message,
+        inputs=[msg, chatbot, max_tokens],
         outputs=[chatbot, msg]
    )
 
-    clear_btn.click(
-        lambda: ([], ""),
-        outputs=[chatbot, msg]
+    clear_btn.click(lambda: [], outputs=[chatbot])
+
+    load_url_btn.click(
+        load_model_from_url,
+        inputs=[model_url],
+        outputs=[status]
    )
 
    load_file_btn.click(
        load_model_from_file,
        inputs=[model_file],
-        outputs=[status_display]
-    )
-
-    load_url_btn.click(
-        load_model_from_url,
-        inputs=[model_url],
-        outputs=[status_display]
+        outputs=[status]
    )
 
 if __name__ == "__main__":
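
For reference, the new handler hands gr.Chatbot its history as a plain list of [user, assistant] pairs (Gradio's default pair format), instead of the role/content dicts the removed chat_respond built. Below is a minimal sketch of that flow with the model call stubbed out so it runs on its own; the fake_generate helper is a hypothetical stand-in for the tokenizer/model pipeline and is not part of the app.

# Sketch of the simplified chat flow from this commit, runnable without the model.

def fake_generate(message: str, max_tokens: int = 20) -> str:
    # Hypothetical stand-in for tokenizer.encode -> model.generate -> decode.
    return f"(stub reply to: {message[:max_tokens]})"

def chat_with_usta(message, history, max_tokens=20):
    """Append a [user, assistant] pair and return the updated history."""
    try:
        response = fake_generate(message, max_tokens)
        history.append([message, response])
    except Exception as e:
        history.append([message, f"Sorry, I encountered an error: {str(e)}"])
    return history

def send_message(message, history, max_tok):
    # Mirrors the Gradio event handler: returns (updated history, cleared textbox value).
    if not message.strip():
        return history, ""
    return chat_with_usta(message, history, max_tok), ""

if __name__ == "__main__":
    history, _ = send_message("What is the capital of France?", [], 20)
    print(history)  # [['What is the capital of France?', '(stub reply to: What is the capital )']]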