Spaces:

Euryeth
/

LLM_Ariphes

Runtime error

Euryeth committed on Jun 8

Commit

e2f4417

verified ·

1 Parent(s): fbbc9c1

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -3,42 +3,44 @@ from transformers import pipeline
 import torch
 import os
-# Set HF token if available in environment (provided via Hugging Face Spaces Secrets)
-# This is CRITICAL to access gated models like Mistral-7B-Instruct-v0.2
 from huggingface_hub import login
-login(os.getenv("HUGGINGFACEHUB_API_TOKEN"))  # automatically handles secrets
-# Use safe float32 for CPU compatibility
 torch_dtype = torch.float32
-# Configure cache directory
 os.environ['HF_HOME'] = '/tmp/cache'
-# Load the model pipeline
 generator = pipeline(
     "text-generation",
-    model="mistralai/Mistral-7B-Instruct-v0.2",
     device=0 if torch.cuda.is_available() else -1,
     torch_dtype=torch_dtype
 )
 def generate_chat_completion(message, history):
-    """Basic chatbot for Gradio interface"""
     prompt = f"User: {message}\nAssistant:"
     output = generator(
         prompt,
-        max_new_tokens=512,
-        temperature=0.8,
-        top_p=0.95,
-        repetition_penalty=1.15,
         do_sample=True
     )
     response = output[0]['generated_text'].replace(prompt, "").strip()
     return response
-gr.ChatInterface(fn=generate_chat_completion,
-                 title="Mistral Chatbot",
-                 description="Chat with Mistral-7B",
-                 retry_btn="Retry",
-                 undo_btn="Undo",
-                 clear_btn="Clear").launch()

 import torch
 import os
+# Login using Hugging Face token from environment variable (set via Secrets)
 from huggingface_hub import login
+login(os.getenv("HUGGINGFACEHUB_API_TOKEN"))
+# Use float32 for CPU/GPU compatibility
 torch_dtype = torch.float32
+# Set Hugging Face cache dir (optional but helps in Spaces)
 os.environ['HF_HOME'] = '/tmp/cache'
+# Load Falcon 1B Instruct model pipeline
 generator = pipeline(
     "text-generation",
+    model="tiiuae/falcon-rw-1b-instruct",
     device=0 if torch.cuda.is_available() else -1,
     torch_dtype=torch_dtype
 )
 def generate_chat_completion(message, history):
+    """Simple chatbot logic"""
     prompt = f"User: {message}\nAssistant:"
     output = generator(
         prompt,
+        max_new_tokens=256,
+        temperature=0.9,
+        top_p=0.9,
+        repetition_penalty=1.1,
         do_sample=True
     )
     response = output[0]['generated_text'].replace(prompt, "").strip()
     return response
+# Gradio chat interface
+gr.ChatInterface(
+    fn=generate_chat_completion,
+    title="Falcon Chatbot",
+    description="Roleplay-ready chat using Falcon-1B-Instruct",
+    retry_btn="Retry",
+    undo_btn="Undo",
+    clear_btn="Clear"
+).launch()