abhi1nandy2 committed on
Commit
7ea7d8d
·
verified ·
1 Parent(s): 6761a81

Update app.py

Browse files
Files changed (1)
  1. app.py +6 -9
app.py CHANGED
@@ -18,7 +18,7 @@ def get_text_from_url(url):
18
  visible_texts = filter(tag_visible, texts)
19
  return "\n".join(t.strip() for t in visible_texts)
20
 
21
- # Get the text from your homepage (and any additional extensions as needed)
22
  text_list = []
23
  homepage_url = "https://sites.google.com/view/abhilashnandy/home/"
24
  extensions = ["", "pmrf-profile-page"]
@@ -26,18 +26,15 @@ for ext in extensions:
26
  url_text = get_text_from_url(homepage_url + ext)
27
  text_list.append(url_text)
28
 
29
- # Optionally, repeat for sub-links if necessary
30
-
31
- # Build a system message with the homepage info
32
  SYSTEM_MESSAGE = (
33
  "You are a QA chatbot to answer queries (in less than 30 words) on my homepage that has the following information -\n\n"
34
  + "\n\n".join(text_list)
35
  + "\n\n"
36
  )
37
 
38
- # Use a model that works well on CPU, has a decently long context, and low inference latency.
39
- # Here we choose a small chat-optimized model:
40
- client = InferenceClient("TheBloke/TinyLlama-1.1B-Chat-v1.0-GGUF")
41
 
42
  def respond(message, history: list[tuple[str, str]], system_message=SYSTEM_MESSAGE,
43
  max_tokens=140, temperature=0.7, top_p=0.95):
@@ -54,7 +51,7 @@ def respond(message, history: list[tuple[str, str]], system_message=SYSTEM_MESSA
54
  max_tokens=max_tokens,
55
  temperature=temperature,
56
  top_p=top_p,
57
- # stream=True, # Uncomment to enable streaming
58
  )
59
  return response.choices[0].message["content"]
60
  except Exception as e:
@@ -71,7 +68,7 @@ with demo:
71
  fn=respond,
72
  examples=["Yo who dis Abhilash?", "What is Abhilash's most recent publication?"],
73
  additional_inputs=[
74
- # You can add extra Gradio components here if needed.
75
  ],
76
  )
77
 
 
18
  visible_texts = filter(tag_visible, texts)
19
  return "\n".join(t.strip() for t in visible_texts)
20
 
21
+ # Gather text from your homepage (and any extensions)
22
  text_list = []
23
  homepage_url = "https://sites.google.com/view/abhilashnandy/home/"
24
  extensions = ["", "pmrf-profile-page"]
 
26
  url_text = get_text_from_url(homepage_url + ext)
27
  text_list.append(url_text)
28
 
29
+ # Build the system message with homepage info.
 
 
30
  SYSTEM_MESSAGE = (
31
  "You are a QA chatbot to answer queries (in less than 30 words) on my homepage that has the following information -\n\n"
32
  + "\n\n".join(text_list)
33
  + "\n\n"
34
  )
35
 
36
+ # Use the GPTQ variant of TinyLlama which includes the tokenizer configuration
37
+ client = InferenceClient("TheBloke/TinyLlama-1.1B-Chat-v1.0-GPTQ")
 
38
 
39
  def respond(message, history: list[tuple[str, str]], system_message=SYSTEM_MESSAGE,
40
  max_tokens=140, temperature=0.7, top_p=0.95):
 
51
  max_tokens=max_tokens,
52
  temperature=temperature,
53
  top_p=top_p,
54
+ # stream=True, # Uncomment this if you want streaming output for debugging.
55
  )
56
  return response.choices[0].message["content"]
57
  except Exception as e:
 
68
  fn=respond,
69
  examples=["Yo who dis Abhilash?", "What is Abhilash's most recent publication?"],
70
  additional_inputs=[
71
+ # Additional components can be added here if needed.
72
  ],
73
  )
74