zoya23 committed on
Commit
d548b01
·
verified ·
1 Parent(s): 802471d

Update agents/language_agent.py

Browse files
Files changed (1) hide show
  1. agents/language_agent.py +15 -6
agents/language_agent.py CHANGED
@@ -1,8 +1,17 @@
1
- from transformers import pipeline
 
 
2
 
3
- # Load once at module level
4
- summarizer = pipeline("summarization", model="google/flan-t5-small")
 
 
 
 
 
5
 
6
- def generate_brief(text):
7
- response = summarizer(text, max_length=80, min_length=20, do_sample=False)
8
- return response[0]['summary_text']
 
 
 
1
+ from langchain.llms import CTransformers
2
+ from langchain.chains import RetrievalQA
3
+ from agents.retriever_agent import create_vectorstore
4
 
5
+ def generate_brief(question):
6
+ # Load a local quantized model (runs offline; no API key needed)
7
+ llm = CTransformers(
8
+ model="models/mistral-7b-instruct-v0.1.Q4_K_M.gguf", # Or use t5-small with transformers
9
+ model_type="mistral",
10
+ config={'max_new_tokens': 512, 'temperature': 0.7}
11
+ )
12
 
13
+ vectordb = create_vectorstore()
14
+ retriever = vectordb.as_retriever()
15
+
16
+ qa_chain = RetrievalQA.from_chain_type(llm=llm, retriever=retriever)
17
+ return qa_chain.run(question)