Update app.py
Browse files
app.py
CHANGED
@@ -11,8 +11,8 @@ import uuid # For generating unique session IDs
|
|
11 |
app = FastAPI()
|
12 |
|
13 |
# === Model Config ===
|
14 |
-
#
|
15 |
-
REPO_ID = "
|
16 |
FILENAME = "tinyllama-1.1b-chat-v1.0.Q4_K_M.gguf" # Q4_K_M is a good balance of size and quality
|
17 |
MODEL_DIR = "models"
|
18 |
MODEL_PATH = os.path.join(MODEL_DIR, FILENAME)
|
@@ -185,4 +185,4 @@ async def generate(request: Request):
|
|
185 |
# Remove the last user message from history if generation failed to prevent bad state
|
186 |
if chat_histories[session_id] and chat_histories[session_id][-1]["role"] == "user":
|
187 |
chat_histories[session_id].pop()
|
188 |
-
return {"error": f"Failed to generate response: {e}. Please try again.", "session_id": session_id}, 500
|
|
|
11 |
# FastAPI application instance; route handlers elsewhere in app.py attach to it.
app = FastAPI()
13 |
# === Model Config ===
# Hugging Face repository hosting the GGUF build of TinyLlama (TheBloke's conversion).
REPO_ID = "TheBloke/TinyLlama-1.1B-Chat-v1.0-GGUF"
# Q4_K_M quantization: a reasonable trade-off between file size and output quality.
FILENAME = "tinyllama-1.1b-chat-v1.0.Q4_K_M.gguf"
# Local directory into which the model file is downloaded.
MODEL_DIR = "models"
MODEL_PATH = os.path.join(MODEL_DIR, FILENAME)
|
|
185 |
# Remove the last user message from history if generation failed to prevent bad state
|
186 |
if chat_histories[session_id] and chat_histories[session_id][-1]["role"] == "user":
|
187 |
chat_histories[session_id].pop()
|
188 |
+
return {"error": f"Failed to generate response: {e}. Please try again.", "session_id": session_id}, 500
|