Spaces:

Futuresony
/

FuturesonyAi

Runtime error

App Files Files Community

Futuresony committed on Dec 12, 2024

Commit

3f65533

verified ·

1 Parent(s): 80ad184

Update app.py

Browse files

Files changed (1) hide show

app.py +36 -20

app.py CHANGED Viewed

@@ -4,17 +4,15 @@ from huggingface_hub import InferenceClient
 """
 For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
 """
-client = InferenceClient("Futuresony/future_ai_12_10_2024.gguf")
-def respond(
-    message,
-    history: list[tuple[str, str]],
-    system_message,
-    max_tokens,
-    temperature,
-    top_p,
-):
     messages = [{"role": "system", "content": system_message}]
     for val in history:
@@ -29,10 +27,10 @@ def respond(
     for message in client.chat_completion(
         messages,
-        max_tokens=max_tokens,
         stream=True,
-        temperature=temperature,
-        top_p=top_p,
     ):
         token = message.choices[0].delta.content
@@ -40,16 +38,34 @@ def respond(
         yield response
-"""
-For information on how to customize the ChatInterface, peruse the gradio docs: https://www.gradio.app/docs/chatinterface
-"""
 if __name__ == "__main__":
-   """
     demo.launch()
-    """
-    app.run(debug=True, port=7860)

 """
 For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
 """
+client = InferenceClient(model="Futuresony/future_ai_12_10_2024.gguf")
+# Set fixed parameters
+MAX_TOKENS = 512
+TEMPERATURE = 0.7
+TOP_P = 0.95
+def respond(message, history: list[tuple[str, str]], system_message):
     messages = [{"role": "system", "content": system_message}]
     for val in history:
     for message in client.chat_completion(
         messages,
+        max_tokens=MAX_TOKENS,
         stream=True,
+        temperature=TEMPERATURE,
+        top_p=TOP_P,
     ):
         token = message.choices[0].delta.content
         yield response
+# Gradio interface setup: a Blocks layout with a chat display, a history state, an editable system prompt, a message box, and a Send button.
+with gr.Blocks() as demo:
+    # Chatbot Interface: `chatbot` receives the conversation history returned by chat(); `state` holds the history list and starts empty.
+    chatbot = gr.Chatbot()
+    state = gr.State([])
+    system_message = gr.Textbox(
+        value="You are a helpful assistant.",
+        label="System Prompt",
+        placeholder="Enter system instructions here...",
+    )
+    user_message = gr.Textbox(label="Your Message", placeholder="Type your message...")
+    send_button = gr.Button("Send")
+    # Handle one user turn: call respond() with the message, the history, and the system prompt, then return the updated history for both the chatbot display and the state.
+    def chat(user_input, chat_history, sys_msg):
+        response_generator = respond(user_input, chat_history, sys_msg)
+        response = ""
+        for partial_response in response_generator:  # drain the generator; only the last yielded value is kept, so the reply is not streamed to the UI
+            response = partial_response
+        chat_history.append((user_input, response))  # appends the (user, assistant) pair to the history list in place
+        return chat_history, chat_history  # the same list is returned twice, one value per entry in outputs=[chatbot, state]
+    send_button.click(  # clicking Send runs chat(); user_message is not among the outputs, so this handler does not clear it
+        chat,
+        inputs=[user_message, state, system_message],
+        outputs=[chatbot, state],
+    )
 if __name__ == "__main__":
     demo.launch()