Spaces:
Runtime error
Runtime error
Update llm.py
Browse files
llm.py
CHANGED
@@ -1,12 +1,10 @@
|
|
1 |
-
|
2 |
-
from transformers import AutoModelForCausalLM, AutoTokenizer
|
3 |
|
4 |
-
# load model once
|
5 |
tokenizer = AutoTokenizer.from_pretrained("distilgpt2")
|
6 |
model = AutoModelForCausalLM.from_pretrained("distilgpt2")
|
7 |
|
8 |
def generate_answer(context, question):
|
9 |
prompt = f"Context:\n{context}\n\nQuestion: {question}\nAnswer:"
|
10 |
-
inputs = tokenizer.encode(prompt, return_tensors='pt',
|
11 |
-
outputs = model.generate(inputs, max_new_tokens=
|
12 |
-
return tokenizer.decode(outputs[0], skip_special_tokens=True).strip()
|
|
|
1 |
+
from transformers import AutoTokenizer, AutoModelForCausalLM
|
|
|
2 |
|
|
|
3 |
tokenizer = AutoTokenizer.from_pretrained("distilgpt2")
|
4 |
model = AutoModelForCausalLM.from_pretrained("distilgpt2")
|
5 |
|
6 |
def generate_answer(context, question):
    """Generate a sampled completion for a context/question prompt.

    Builds a ``Context: ... Question: ... Answer:`` prompt, encodes it with
    the module-level ``tokenizer`` and samples a continuation from the
    module-level ``model``.

    Args:
        context: Background text inserted after ``Context:``.
        question: Question text inserted after ``Question:``.

    Returns:
        The decoded output sequence with special tokens removed and
        surrounding whitespace stripped. The decoded text is the whole
        sequence returned by ``generate`` (prompt followed by the
        continuation), not just the continuation.
    """
    max_new_tokens = 60
    # The prompt and the generated tokens share one position window. The
    # original truncated the prompt to the full 1024 positions, which left
    # no room for the new tokens and overflowed the model's position
    # embeddings on long contexts. Reserve the generation budget up front.
    context_window = getattr(model.config, "n_positions", 1024)
    max_prompt_tokens = max(1, context_window - max_new_tokens)

    prompt = f"Context:\n{context}\n\nQuestion: {question}\nAnswer:"
    # NOTE(review): truncation presumably drops tokens from the end of the
    # prompt (the tokenizer's default side), so a very long context can cut
    # off the question itself -- confirm and consider trimming `context`.
    inputs = tokenizer.encode(
        prompt,
        return_tensors='pt',
        truncation=True,
        max_length=max_prompt_tokens,
    )
    outputs = model.generate(
        inputs,
        max_new_tokens=max_new_tokens,
        do_sample=True,
        # Reuse EOS as the padding id, as the original call did.
        pad_token_id=tokenizer.eos_token_id,
    )
    return tokenizer.decode(outputs[0], skip_special_tokens=True).strip()
|