Spaces:
Paused
Paused
Carlos Rosas
committed on
Update app.py
Browse files
app.py
CHANGED
|
@@ -13,14 +13,6 @@ import pandas as pd
|
|
| 13 |
# Define the device
|
| 14 |
device = "cuda" if torch.cuda.is_available() else "cpu"
|
| 15 |
|
| 16 |
-
# Define variables
|
| 17 |
-
temperature = 0.0
|
| 18 |
-
max_new_tokens = 1500
|
| 19 |
-
top_p = 0.95
|
| 20 |
-
repetition_penalty = 1.0
|
| 21 |
-
min_new_tokens = 800
|
| 22 |
-
early_stopping = False
|
| 23 |
-
|
| 24 |
model_name = "PleIAs/Pleias-Rag"
|
| 25 |
|
| 26 |
# Get Hugging Face token from environment variable
|
|
@@ -34,9 +26,19 @@ model = AutoModelForCausalLM.from_pretrained(model_name, token=hf_token)
|
|
| 34 |
model.to(device)
|
| 35 |
|
| 36 |
# Set tokenizer configuration
|
| 37 |
-
|
| 38 |
-
tokenizer.pad_token_id = tokenizer.eos_token_id
|
| 39 |
tokenizer.eos_token = "<|answer_end|>"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 40 |
|
| 41 |
# Connect to the LanceDB database
|
| 42 |
db = lancedb.connect("content 5/lancedb_data")
|
|
|
|
| 13 |
# Define the device
|
| 14 |
device = "cuda" if torch.cuda.is_available() else "cpu"
|
| 15 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 16 |
model_name = "PleIAs/Pleias-Rag"
|
| 17 |
|
| 18 |
# Get Hugging Face token from environment variable
|
|
|
|
| 26 |
model.to(device)
|
| 27 |
|
| 28 |
# Set tokenizer configuration
|
| 29 |
+
|
|
|
|
| 30 |
tokenizer.eos_token = "<|answer_end|>"
|
| 31 |
+
eos_token_id=tokenizer.eos_token_id
|
| 32 |
+
tokenizer.pad_token = tokenizer.eos_token
|
| 33 |
+
tokenizer.pad_token_id = 1
|
| 34 |
+
|
| 35 |
+
# Define variables
|
| 36 |
+
temperature = 0.0
|
| 37 |
+
max_new_tokens = 1500
|
| 38 |
+
top_p = 0.95
|
| 39 |
+
repetition_penalty = 1.0
|
| 40 |
+
min_new_tokens = 800
|
| 41 |
+
early_stopping = False
|
| 42 |
|
| 43 |
# Connect to the LanceDB database
|
| 44 |
db = lancedb.connect("content 5/lancedb_data")
|