Spaces:

ATK20
/

Final_Assignment_Template1

Sleeping

App Files Files Community

ATK20 commited on Apr 26

Commit

1175283

verified ·

1 Parent(s): 8a642b5

Update app.py

Browse files

Files changed (1) hide show

app.py +85 -39

app.py CHANGED Viewed

@@ -71,17 +71,22 @@ class LLMInterface:
     def query_llm(prompt: str) -> str:
         """Query a free LLM through Hugging Face's inference API"""
         try:
-            # Using FLAN-T5-XXL which is available for free
-            API_URL = "https://api-inference.huggingface.co/models/google/flan-t5-xxl"
             headers = {"Content-Type": "application/json"}
             # Use a well-formatted prompt
             payload = {
                 "inputs": prompt,
-                "parameters": {"max_length": 200, "temperature": 0.7}
             }
-            response = requests.post(API_URL, headers=headers, json=payload, timeout=10)
             if response.status_code == 200:
                 result = response.json()
@@ -92,12 +97,32 @@ class LLMInterface:
                     return result.get("generated_text", "").strip()
                 else:
                     return str(result).strip()
             else:
-                # Fallback for rate limits or API issues
-                return "The model is currently unavailable. Please try again later."
         except Exception as e:
-            return f"Error: {str(e)}"
 # --- Advanced Agent Implementation ---
 class BasicAgent:
@@ -218,39 +243,60 @@ class BasicAgent:
         return search_result
     def _get_answer_from_llm(self, question: str) -> str:
-        """Get an answer from the LLM with appropriate prompting"""
-        prompt = f"""
-        Answer the following question with a very concise, direct response:
-        Question: {question}
-        Answer in 1-2 sentences maximum, focusing only on the specific information requested.
-        """
-        # Simple responses for common questions to avoid LLM latency
-        common_answers = {
-            "what color is the sky": "Blue.",
-            "how many days in a week": "7 days.",
-            "how many months in a year": "12 months.",
-            "what is the capital of france": "Paris.",
-            "what is the capital of japan": "Tokyo.",
-            "what is the capital of italy": "Rome.",
-            "what is the capital of germany": "Berlin.",
-            "what is the capital of spain": "Madrid.",
-            "what is water made of": "H2O (hydrogen and oxygen).",
-            "who wrote romeo and juliet": "William Shakespeare.",
-            "who painted the mona lisa": "Leonardo da Vinci.",
-            "what is the largest ocean": "The Pacific Ocean.",
-            "what is the smallest planet": "Mercury."
-        }
-        # Check if we have a hardcoded answer
-        for key, answer in common_answers.items():
-            if question.lower().strip('?').strip() == key:
                 return answer
-        # If no hardcoded answer, use the LLM
-        return self.llm.query_llm(prompt)
 def run_and_submit_all(profile: gr.OAuthProfile | None):
     """

     def query_llm(prompt: str) -> str:
         """Query a free LLM through Hugging Face's inference API"""
         try:
+            # Using a smaller, more reliable free model
+            API_URL = "https://api-inference.huggingface.co/models/facebook/bart-large-cnn"
+            # Alternative models you can try if this one doesn't work:
+            # - "distilbert-base-uncased-finetuned-sst-2-english"
+            # - "gpt2"
+            # - "microsoft/DialoGPT-medium"
             headers = {"Content-Type": "application/json"}
             # Use a well-formatted prompt
             payload = {
                 "inputs": prompt,
+                "parameters": {"max_length": 100, "do_sample": False}
             }
+            response = requests.post(API_URL, headers=headers, json=payload, timeout=30)
             if response.status_code == 200:
                 result = response.json()
                     return result.get("generated_text", "").strip()
                 else:
                     return str(result).strip()
+            elif response.status_code == 503:
+                # Model is loading
+                return "I need more time to think about this. The model is currently loading."
             else:
+                # Fallback for other API issues
+                return "I don't have enough information to answer that question precisely."
+        except requests.exceptions.Timeout:
+            return "The model is taking too long to respond. Let me give a simpler answer instead."
         except Exception as e:
+            # More robust fallback system with common answers
+            common_answers = {
+                "population": "The current world population is approximately 8 billion people.",
+                "capital": "I can tell you about many capitals. For example, Paris is the capital of France.",
+                "math": "I can help with mathematical calculations.",
+                "weather": "I don't have access to current weather information.",
+                "date": "I can tell you that a day has 24 hours.",
+                "time": "I can't check the current time."
+            }
+            # Check if any keywords match
+            for keyword, answer in common_answers.items():
+                if keyword in prompt.lower():
+                    return answer
+            return "I'm sorry, I couldn't process that request properly. Please try asking in a simpler way."
 # --- Advanced Agent Implementation ---
 class BasicAgent:
         return search_result
     def _get_answer_from_llm(self, question: str) -> str:
+    """Get an answer from the LLM with appropriate prompting"""
+    prompt = f"""
+    Answer the following question with a very concise, direct response:
+    Question: {question}
+    Answer in 1-2 sentences maximum, focusing only on the specific information requested.
+    """
+    # Expanded common answers to reduce LLM API dependence
+    common_answers = {
+        "what color is the sky": "Blue.",
+        "how many days in a week": "7 days.",
+        "how many months in a year": "12 months.",
+        "what is the capital of france": "Paris.",
+        "what is the capital of japan": "Tokyo.",
+        "what is the capital of italy": "Rome.",
+        "what is the capital of germany": "Berlin.",
+        "what is the capital of spain": "Madrid.",
+        "what is the capital of united states": "Washington, D.C.",
+        "what is the capital of china": "Beijing.",
+        "what is the capital of russia": "Moscow.",
+        "what is the capital of canada": "Ottawa.",
+        "what is the capital of australia": "Canberra.",
+        "what is the capital of brazil": "Brasília.",
+        "what is water made of": "H2O (hydrogen and oxygen).",
+        "who wrote romeo and juliet": "William Shakespeare.",
+        "who painted the mona lisa": "Leonardo da Vinci.",
+        "what is the largest ocean": "The Pacific Ocean.",
+        "what is the smallest planet": "Mercury.",
+        "what is the largest planet": "Jupiter.",
+        "who invented electricity": "Electricity wasn't invented but discovered through contributions from many scientists including Benjamin Franklin, Michael Faraday, and Thomas Edison.",
+        "how many continents are there": "There are 7 continents: Africa, Antarctica, Asia, Europe, North America, Australia/Oceania, and South America.",
+        "what is the largest country": "Russia is the largest country by land area.",
+        "what is the most spoken language": "Mandarin Chinese is the most spoken native language in the world.",
+        "what is the tallest mountain": "Mount Everest is the tallest mountain above sea level at 8,848.86 meters."
+    }
+    # Clean up the question for better matching
+    clean_question = question.lower().strip('?').strip()
+    # Check if we have a hardcoded answer
+    if clean_question in common_answers:
+        return common_answers[clean_question]
+    # Try partial matching for more flexibility
+    for key, answer in common_answers.items():
+        if clean_question in key or key in clean_question:
+            # Only return if it's a close match
+            if len(clean_question) > len(key) * 0.7 or len(key) > len(clean_question) * 0.7:
                 return answer
+    # If no hardcoded answer, use the LLM
+    return self.llm.query_llm(prompt)
 def run_and_submit_all(profile: gr.OAuthProfile | None):
     """