Spaces:

Hev832
/

chat

Sleeping

App Files Files Community

Hev832 committed on Sep 9, 2024

Commit

e398ade

verified ·

1 Parent(s): 05d3da7

Update app.py

Browse files

Files changed (1) hide show

app.py +35 -24

app.py CHANGED Viewed

@@ -1,9 +1,6 @@
 import gradio as gr
 from huggingface_hub import InferenceClient
-"""
-For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
-"""
 client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
@@ -26,7 +23,6 @@ def respond(
     messages.append({"role": "user", "content": message})
     response = ""
     for message in client.chat_completion(
         messages,
         max_tokens=max_tokens,
@@ -35,29 +31,44 @@ def respond(
         top_p=top_p,
     ):
         token = message.choices[0].delta.content
         response += token
         yield response
-"""
-For information on how to customize the ChatInterface, peruse the gradio docs: https://www.gradio.app/docs/chatinterface
-"""
-demo = gr.ChatInterface(
-    respond,
-    additional_inputs=[
-        gr.Textbox(value="You are a friendly Chatbot.", label="System message"),
-        gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max new tokens"),
-        gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
-        gr.Slider(
-            minimum=0.1,
-            maximum=1.0,
-            value=0.95,
-            step=0.05,
-            label="Top-p (nucleus sampling)",
-        ),
-    ],
-)
 if __name__ == "__main__":
-    demo.launch()

 import gradio as gr
 from huggingface_hub import InferenceClient
 client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
     messages.append({"role": "user", "content": message})
     response = ""
     for message in client.chat_completion(
         messages,
         max_tokens=max_tokens,
         top_p=top_p,
     ):
         token = message.choices[0].delta.content
         response += token
         yield response
+# Chat UI: system prompt on top, chat window next to the sampling controls,
+# and a free-text input underneath that triggers `user_interaction`.
+with gr.Blocks() as demo:
+    system_message = gr.Textbox(
+        label="System Message",
+        value="You are a helpful assistant.",
+        lines=2,
+    )
+    # Conversation so far, kept as a list of (user_message, bot_message) pairs.
+    chat_history = gr.State([])
+    with gr.Row():
+        # Gradio expects integer `scale` values; 4:1 keeps the former 0.8/0.2 split.
+        with gr.Column(scale=4):
+            chatbot = gr.Chatbot()
+        with gr.Column(scale=1):
+            max_tokens = gr.Slider(
+                minimum=1, maximum=512, step=1, value=128, label="Max Tokens"
+            )
+            temperature = gr.Slider(
+                minimum=0, maximum=1, step=0.01, value=0.7, label="Temperature"
+            )
+            top_p = gr.Slider(
+                minimum=0, maximum=1, step=0.01, value=1, label="Top-p"
+            )
+    user_input = gr.Textbox(show_label=False, placeholder="Type your message here...")
+
+    def user_interaction(message, history, system_message, max_tokens, temperature, top_p):
+        """Stream the model's reply to `message` into the chat window.
+
+        `respond` is a generator that yields the reply accumulated so far
+        after each received token, so every partial reply is forwarded
+        instead of only the first one (which `next(...)` would return).
+
+        Yields:
+            A pair `(chatbot_value, state_value)`; both are the previous
+            history plus the current `(message, partial_reply)` turn.
+        """
+        for partial_reply in respond(
+            message, history, system_message, max_tokens, temperature, top_p
+        ):
+            # Build a new list rather than appending: the stored state must not
+            # change until a value is yielded, and `respond` must keep seeing
+            # the history without the turn that is still being generated.
+            updated_history = history + [(message, partial_reply)]
+            yield updated_history, updated_history
+
+    user_input.submit(
+        user_interaction,
+        inputs=[user_input, chat_history, system_message, max_tokens, temperature, top_p],
+        outputs=[chatbot, chat_history],
+    )
 if __name__ == "__main__":
+    demo.launch()