Update app.py

app.py CHANGED
@@ -70,19 +70,24 @@ def format_docs(docs: List[Document]) -> str:
 
 # =================== Generate Response from Hugging Face Model ===================
 def generate_response(input_dict: Dict[str, Any]) -> str:
-    client = InferenceClient(api_key=HF_TOKEN)
+    client = InferenceClient(api_key=HF_TOKEN.strip())
     prompt = grantbuddy_prompt.format(**input_dict)
 
-
-
-
-
-
-
-
-
-
-
+    try:
+        response = client.chat.completions.create(
+            model="Qwen/Qwen2.5-1.5B-Instruct",
+            messages=[
+                {"role": "system", "content": prompt},
+                {"role": "user", "content": input_dict["question"]},
+            ],
+            max_tokens=1000,
+            temperature=0.2,
+        )
+        return response.choices[0].message.content
+    except Exception as e:
+        st.error(f"❌ Error from model: {e}")
+        return "⚠️ Failed to generate response. Please check your model, HF token, or request format."
+
 
 # =================== RAG Chain ===================
 def get_rag_chain(retriever):
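For reference, a minimal sketch of the setup the changed hunk depends on. These definitions live earlier in app.py and are not shown in this diff, so the environment variable name and the prompt wording below are assumptions; only the identifiers (HF_TOKEN, grantbuddy_prompt, InferenceClient, st) come from the code above.

# Minimal sketch of the context assumed by generate_response() above.
# ASSUMPTIONS: the token's env var name and the prompt text are guesses;
# only the identifiers themselves appear in the diffed code.
import os
from typing import Any, Dict

import streamlit as st
from huggingface_hub import InferenceClient  # provides client.chat.completions.create

HF_TOKEN = os.environ.get("HF_TOKEN", "")  # assumed to be set as a Space secret

# Assumed plain-string template; generate_response() calls .format(**input_dict),
# so its placeholders must match the keys of input_dict.
grantbuddy_prompt = (
    "You are GrantBuddy, a grant-writing assistant.\n"
    "Use the following context to answer the question.\n\n"
    "Context:\n{context}\n\n"
    "Question:\n{question}"
)

A call would then look like this (the context and question strings are purely illustrative):

answer = generate_response(
    {"context": "Example grant guidelines...", "question": "What does this grant fund?"}
)

Wrapping the chat-completion call in try/except, as the new hunk does, keeps a bad token or model name from crashing the Streamlit app: the error surfaces via st.error() and the caller still receives a string.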