Spaces:
Runtime error
Update app.py
app.py CHANGED
@@ -16,13 +16,13 @@ pipeline = transformers.pipeline(
 )
 
 def chat_function(message, history, system_prompt, max_new_tokens, temperature):
-    # Assuming history is a list of tuples (user_message, assistant_message)
     messages = []
-
-
-
+    if history is not None:
+        for user_msg, assistant_msg in history:
+            messages.append({"role": "user", "content": user_msg})
+            messages.append({"role": "assistant", "content": assistant_msg})
 
-    #
+    # Always add the current user message
     messages.append({"role": "user", "content": message})
 
     # Construct the prompt using the pipeline's tokenizer
@@ -32,12 +32,6 @@ def chat_function(message, history, system_prompt, max_new_tokens, temperature):
         add_generation_prompt=True
     )
 
-    # Generate the response
-    terminators = [
-        pipeline.tokenizer.eos_token_id,
-        pipeline.tokenizer.convert_tokens_to_ids("<|eot_id|>")
-    ]
-
     # Adjust the temperature slightly above given to ensure variety
     adjusted_temp = temperature + 0.1
 
@@ -45,7 +39,6 @@ def chat_function(message, history, system_prompt, max_new_tokens, temperature):
     outputs = pipeline(
         prompt,
         max_new_tokens=max_new_tokens,
-        eos_token_id=terminators,
         do_sample=True,
         temperature=adjusted_temp,
         top_p=0.9
@@ -55,12 +48,12 @@ def chat_function(message, history, system_prompt, max_new_tokens, temperature):
     generated_text = outputs[0]["generated_text"]
     return generated_text[len(prompt):]  # Return the new part of the conversation
 
-#Gradio interface
+# Update Gradio interface to reflect the potential nullability of history
 gr.Interface(
     fn=chat_function,
     inputs=[
         gr.Textbox(placeholder="Enter your message here", label="Your Message"),
-        gr.JSON(label="Conversation History (format as [[user, assistant], ...])"),
+        gr.JSON(label="Conversation History (format as [[user, assistant], ...])", optional=True),  # Marked as optional
         gr.Textbox(label="System Prompt"),
         gr.Slider(512, 4096, label="Max New Tokens"),
         gr.Slider(0.0, 1.0, step=0.1, label="Temperature")
@@ -69,6 +62,7 @@ gr.Interface(
 ).launch()
 
 
+
 # def chat_function(message, history, system_prompt,max_new_tokens,temperature):
 # messages = [
 #     {"role": "system", "content": system_prompt},
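The core fix: Gradio can hand chat_function a history of None on the first turn of a fresh session, and iterating over None raises a TypeError, which would explain the Space's "Runtime error" status. A standalone sketch of the flattening step this commit adds; the sample conversation below is invented for illustration:

# Sketch of the history-flattening logic this commit adds.
# `history` uses Gradio's tuple format: [[user, assistant], ...].
def build_messages(message, history):
    messages = []
    if history is not None:  # None on the first turn of a fresh session
        for user_msg, assistant_msg in history:
            messages.append({"role": "user", "content": user_msg})
            messages.append({"role": "assistant", "content": assistant_msg})
    messages.append({"role": "user", "content": message})  # current turn
    return messages

# Example: second turn of an invented conversation
print(build_messages("And Spain?", [["Capital of France?", "Paris."]]))
# [{'role': 'user', 'content': 'Capital of France?'},
#  {'role': 'assistant', 'content': 'Paris.'},
#  {'role': 'user', 'content': 'And Spain?'}]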
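The prompt-construction step the diff leaves unchanged (lines 28-33) runs these messages through the tokenizer's chat template. A self-contained sketch of that step; the checkpoint name below is a placeholder, not taken from this Space:

# Sketch of prompt construction via the tokenizer's chat template,
# assuming an instruct-tuned checkpoint (model name is a placeholder).
from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("meta-llama/Meta-Llama-3-8B-Instruct")
prompt = tokenizer.apply_chat_template(
    [{"role": "user", "content": "Hello!"}],
    tokenize=False,              # return a string rather than token ids
    add_generation_prompt=True,  # append the assistant header so the model answers
)
print(prompt)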
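The comment on adjusted_temp undersells what the + 0.1 does: with do_sample=True, transformers requires a strictly positive temperature, so it also keeps the slider's minimum of 0.0 from crashing generation. It equally pushes the maximum to 1.1, though. A sketch of a clamp that guards the low end without exceeding the slider's advertised range; the floor value is a suggestion, not the Space's code:

# Sketch: keep temperature strictly positive for sampling without
# drifting above the UI's 0.0-1.0 range (floor value is a suggestion).
def adjust_temperature(temperature, floor=0.1):
    # transformers raises a ValueError for temperature <= 0 when
    # do_sample=True, so clamp instead of unconditionally adding 0.1.
    return max(temperature, floor)

assert adjust_temperature(0.0) == 0.1
assert adjust_temperature(0.7) == 0.7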
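The deleted terminators list is the standard Llama 3 idiom: that family's chat template ends each assistant turn with <|eot_id|>, which differs from the tokenizer's default EOS, so dropping eos_token_id=terminators can let such a model generate past the end of its turn. If that behaviour resurfaces, a sketch of restoring it, reusing the Space's pipeline and prompt and assuming a Llama-3-style tokenizer:

# Sketch: stop on either the default EOS or Llama 3's end-of-turn token.
# Assumes a Llama-3-style tokenizer; other models use different tokens.
terminators = [
    pipeline.tokenizer.eos_token_id,
    pipeline.tokenizer.convert_tokens_to_ids("<|eot_id|>"),
]
outputs = pipeline(
    prompt,
    max_new_tokens=512,
    eos_token_id=terminators,  # recent transformers accepts a list of ids
    do_sample=True,
    temperature=0.7,
    top_p=0.9,
)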
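The generated_text[len(prompt):] slice works because the text-generation pipeline returns prompt plus completion by default. The same pipeline exposes return_full_text=False to get only the completion, which avoids the slicing; a sketch, again reusing the Space's pipeline:

# Sketch: let the pipeline drop the prompt instead of slicing it off.
outputs = pipeline(
    prompt,
    max_new_tokens=512,
    do_sample=True,
    temperature=0.8,
    top_p=0.9,
    return_full_text=False,  # "generated_text" holds only the new tokens
)
reply = outputs[0]["generated_text"]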
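One caveat on the interface hunk: optional was a keyword of Gradio's legacy gradio.inputs components, and current gr.JSON may not accept it, so the None-check inside chat_function is what actually prevents the crash. For a chat app, gr.ChatInterface sidesteps hand-maintained history entirely by passing (message, history) itself. A minimal sketch with a stub reply so it runs standalone; labels and ranges mirror the original sliders:

# Sketch: gr.ChatInterface manages the [[user, assistant], ...] history
# itself, so chat_function never sees a malformed or missing history.
import gradio as gr

def chat_function(message, history, system_prompt, max_new_tokens, temperature):
    # Stub reply so this sketch runs standalone; the real app would
    # build messages and call the transformers pipeline here.
    return f"(echo) {message}"

gr.ChatInterface(
    fn=chat_function,
    additional_inputs=[
        gr.Textbox(label="System Prompt"),
        gr.Slider(512, 4096, label="Max New Tokens"),
        gr.Slider(0.0, 1.0, step=0.1, label="Temperature"),
    ],
).launch()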