CCockrum committed on
Commit edd5165 · verified · 1 parent: 30d38df

Update app.py

Files changed (1): app.py (+3 −3)
app.py CHANGED
@@ -34,7 +34,7 @@ if "follow_up" not in st.session_state:
     st.session_state.follow_up = ""
 
 # ✅ Initialize Hugging Face Model (Explicitly Set to CPU/GPU)
-def get_llm_hf_inference(model_id="meta-llama/Llama-2-7b-chat-hf", max_new_tokens=800, temperature=0.8):
+def get_llm_hf_inference(model_id="meta-llama/Llama-2-7b-chat-hf", max_new_tokens=800, temperature=0.7):
     #mistralai/Mistral-7B-Instruct-v0.3
     return HuggingFaceEndpoint(
         repo_id=model_id,
@@ -91,7 +91,7 @@ def generate_follow_up(user_text):
         "Ensure it's concise and structured exactly as requested without extra commentary."
     )
 
-    hf = get_llm_hf_inference(max_new_tokens=30, temperature=0.8)  # 🔥 Lower temp for consistency
+    hf = get_llm_hf_inference(max_new_tokens=30, temperature=0.3)  # 🔥 Lower temp for consistency
     output = hf.invoke(input=prompt_text).strip()
 
     # ✅ Extract the relevant part using regex to remove unwanted symbols or truncations
@@ -120,7 +120,7 @@ def get_response(system_message, chat_history, user_text, max_new_tokens=800):
         return response, follow_up, chat_history, nasa_url
 
     # ✅ Invoke Hugging Face Model
-    hf = get_llm_hf_inference(max_new_tokens=max_new_tokens, temperature=0.9)
+    hf = get_llm_hf_inference(max_new_tokens=max_new_tokens, temperature=0.7)
 
     filtered_history = "\n".join(f"{msg['role']}: {msg['content']}" for msg in chat_history)
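
Taken together, the three hunks lower the sampling temperature at every call site: the factory default drops from 0.8 to 0.7, the follow-up generator from 0.8 to 0.3, and the main response path from 0.9 to 0.7, trading output variety for consistency. Below is a minimal sketch of the tuned pattern after this commit. It is not the full app.py: the langchain_huggingface import path is an assumption (the app may import HuggingFaceEndpoint from langchain_community instead), and any other keyword arguments passed to the endpoint are omitted.

# Minimal sketch of the factory this commit tunes. The import path is an
# assumption; the real app.py may use langchain_community.llms instead.
from langchain_huggingface import HuggingFaceEndpoint

def get_llm_hf_inference(model_id="meta-llama/Llama-2-7b-chat-hf",
                         max_new_tokens=800, temperature=0.7):
    # Single factory shared by all call sites; the default temperature
    # now matches the main response path (0.7 after this commit).
    return HuggingFaceEndpoint(
        repo_id=model_id,
        max_new_tokens=max_new_tokens,
        temperature=temperature,
    )

# The two call sites touched by the diff:
follow_up_llm = get_llm_hf_inference(max_new_tokens=30, temperature=0.3)  # short, near-deterministic follow-up questions
response_llm = get_llm_hf_inference(max_new_tokens=800, temperature=0.7)  # main chat responses

# Same invocation style as app.py's `hf.invoke(input=prompt_text)`:
print(response_llm.invoke(input="Hello"))

The very low follow-up temperature (0.3) makes sense for a 30-token completion that must follow a strict format, while 0.7 keeps the longer chat responses varied but less erratic than the previous 0.9.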