gaur3009 committed
Commit 1262e09 · verified
1 Parent(s): e4c807c

Update llm.py

Files changed (1)
  1. llm.py +4 -6
llm.py CHANGED
@@ -1,12 +1,10 @@
-# llm.py
-from transformers import AutoModelForCausalLM, AutoTokenizer
+from transformers import AutoTokenizer, AutoModelForCausalLM
 
-# load model once
 tokenizer = AutoTokenizer.from_pretrained("distilgpt2")
 model = AutoModelForCausalLM.from_pretrained("distilgpt2")
 
 def generate_answer(context, question):
     prompt = f"Context:\n{context}\n\nQuestion: {question}\nAnswer:"
-    inputs = tokenizer.encode(prompt, return_tensors='pt', max_length=1024, truncation=True)
-    outputs = model.generate(inputs, max_new_tokens=50, do_sample=True)
-    return tokenizer.decode(outputs[0], skip_special_tokens=True).strip()
+    inputs = tokenizer.encode(prompt, return_tensors='pt', truncation=True, max_length=1024)
+    outputs = model.generate(inputs, max_new_tokens=60, do_sample=True, pad_token_id=tokenizer.eos_token_id)
+    return tokenizer.decode(outputs[0], skip_special_tokens=True).strip()
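
For reference, a minimal usage sketch of the updated generate_answer (the context and question strings below are hypothetical, and it is assumed llm.py is importable from the application code):

    from llm import generate_answer

    # Hypothetical inputs, for illustration only
    context = "distilgpt2 is a distilled version of GPT-2 released by Hugging Face."
    question = "What is distilgpt2?"
    print(generate_answer(context, question))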