Spaces:

OuroborosM
/

STLA-BABY

Runtime error

App Files Files Community

STLA-BABY / app.py

OuroborosM

add error tracking function

d80c981 almost 2 years ago

raw

history blame

7.62 kB

	from typing import Any, Coroutine
	import openai
	import os
	from langchain.vectorstores import Chroma
	from langchain.embeddings.openai import OpenAIEmbeddings
	from langchain.text_splitter import CharacterTextSplitter
	from langchain.chat_models import AzureChatOpenAI
	from langchain.document_loaders import DirectoryLoader
	from langchain.chains import RetrievalQA
	from langchain.vectorstores import Pinecone
	from langchain.agents import initialize_agent
	from langchain.agents import AgentType
	from langchain.agents import tool
	from langchain.tools import BaseTool

	import pinecone
	from pinecone.core.client.configuration import Configuration as OpenApiConfiguration
	import gradio as gr
	import time

	class DB_Search(BaseTool):
	name = "Vector Database Search"
	description = "This is the vector database to search local information"
	def _run(self, query: str) -> str:
	response, source = QAQuery_p(query)
	# response = "test db_search feedback"
	return response

	def _arun(self, query: str):
	raise NotImplementedError("N/A")

	tools = [DB_Search()]



	os.environ["OPENAI_API_TYPE"] = "azure"
	os.environ["OPENAI_API_KEY"] = os.getenv("OPENAI_API_KEY")
	os.environ["OPENAI_API_BASE"] = os.getenv("OPENAI_API_BASE")
	os.environ["OPENAI_API_VERSION"] = "2023-05-15"
	username = os.getenv("username")
	password = os.getenv("password")
	SysLock = os.getenv("SysLock") # 0=unlock 1=lock

	chat = AzureChatOpenAI(
	deployment_name="Chattester",
	temperature=0,
	)

	embeddings = OpenAIEmbeddings(deployment="model_embedding", chunk_size=15)


	pinecone.init(
	api_key = os.getenv("pinecone_api_key"),
	environment='asia-southeast1-gcp-free',
	# openapi_config=openapi_config
	)
	index_name = 'stla-baby'
	index = pinecone.Index(index_name)
	# index.delete(delete_all=True, namespace='')
	# print(pinecone.whoami())
	# print(index.describe_index_stats())

	llm = chat
	agent = initialize_agent(tools, llm,
	agent=AgentType.ZERO_SHOT_REACT_DESCRIPTION,
	verbose = True,
	handle_parsing_errors = True)

	global vectordb
	vectordb = Chroma(persist_directory='db', embedding_function=embeddings)
	global vectordb_p
	vectordb_p = Pinecone.from_existing_index(index_name, embeddings)

	# loader = DirectoryLoader('./documents', glob='*/.txt')
	# documents = loader.load()
	# text_splitter = CharacterTextSplitter(chunk_size=500, chunk_overlap=200)
	# split_docs = text_splitter.split_documents(documents)
	# print(split_docs)
	# vectordb = Chroma.from_documents(split_docs, embeddings, persist_directory='db')



	# question = "what is LCDV ?"
	# rr = vectordb.similarity_search(query=question, k=4)
	# vectordb.similarity_search(question)
	# print(type(rr))
	# print(rr)
	def chathmi(message, history):
	# response = "I don't know"
	# print(message)
	response, source = QAQuery_p(message)
	time.sleep(0.3)
	print(history)
	yield response
	# yield history

	def chathmi2(message, history):
	try:
	output = agent.run(message)
	time.sleep(0.3)
	print("History: ", history)
	response = output
	yield response
	except Exception as e:
	print("error:", e)

	# yield history
	# chatbot = gr.Chatbot().style(color_map =("blue", "pink"))
	# chatbot = gr.Chatbot(color_map =("blue", "pink"))

	demo = gr.ChatInterface(
	chathmi2,
	title="STLA BABY - YOUR FRIENDLY GUIDE ",
	description= "v0.2: Powered by MECH Core Team",
	)

	# demo = gr.Interface(
	# chathmi,
	# ["text", "state"],
	# [chatbot, "state"],
	# allow_flagging="never",
	# )

	def CreatDb_P():
	global vectordb_p
	index_name = 'stla-baby'
	loader = DirectoryLoader('./documents', glob='*/.txt')
	documents = loader.load()
	text_splitter = CharacterTextSplitter(chunk_size=500, chunk_overlap=200)
	split_docs = text_splitter.split_documents(documents)
	print(split_docs)
	pinecone.Index(index_name).delete(delete_all=True, namespace='')
	vectordb_p = Pinecone.from_documents(split_docs, embeddings, index_name = "stla-baby")
	print("Pinecone Updated Done")
	print(index.describe_index_stats())

	def QAQuery_p(question: str):
	global vectordb_p
	# vectordb = Chroma(persist_directory='db', embedding_function=embeddings)
	retriever = vectordb_p.as_retriever()
	retriever.search_kwargs['k'] = int(os.getenv("search_kwargs_k"))
	# retriever.search_kwargs['fetch_k'] = 100

	qa = RetrievalQA.from_chain_type(llm=chat, chain_type="stuff",
	retriever=retriever, return_source_documents = True,
	verbose = True)
	# qa = VectorDBQA.from_chain_type(llm=chat, chain_type="stuff", vectorstore=vectordb, return_source_documents=True)
	# res = qa.run(question)
	res = qa({"query": question})

	print("-" * 20)
	print("Question:", question)
	# print("Answer:", res)
	print("Answer:", res['result'])
	print("-" * 20)
	print("Source:", res['source_documents'])
	response = res['result']
	# response = res['source_documents']
	source = res['source_documents']
	return response, source

	def CreatDb():
	global vectordb
	loader = DirectoryLoader('./documents', glob='*/.txt')
	documents = loader.load()
	text_splitter = CharacterTextSplitter(chunk_size=500, chunk_overlap=200)
	split_docs = text_splitter.split_documents(documents)
	print(split_docs)
	vectordb = Chroma.from_documents(split_docs, embeddings, persist_directory='db')
	vectordb.persist()

	def QAQuery(question: str):
	global vectordb
	# vectordb = Chroma(persist_directory='db', embedding_function=embeddings)
	retriever = vectordb.as_retriever()
	retriever.search_kwargs['k'] = 3
	# retriever.search_kwargs['fetch_k'] = 100

	qa = RetrievalQA.from_chain_type(llm=chat, chain_type="stuff", retriever=retriever, return_source_documents = True)
	# qa = VectorDBQA.from_chain_type(llm=chat, chain_type="stuff", vectorstore=vectordb, return_source_documents=True)
	# res = qa.run(question)
	res = qa({"query": question})

	print("-" * 20)
	print("Question:", question)
	# print("Answer:", res)
	print("Answer:", res['result'])
	print("-" * 20)
	print("Source:", res['source_documents'])
	response = res['result']
	return response

	# Used to complete content
	def completeText(Text):
	deployment_id="Chattester"
	prompt = Text
	completion = openai.Completion.create(deployment_id=deployment_id,
	prompt=prompt, temperature=0)
	print(f"{prompt}{completion['choices'][0]['text']}.")

	# Used to chat
	def chatText(Text):
	deployment_id="Chattester"
	conversation = [{"role": "system", "content": "You are a helpful assistant."}]
	user_input = Text
	conversation.append({"role": "user", "content": user_input})
	response = openai.ChatCompletion.create(messages=conversation,
	deployment_id="Chattester")
	print("\n" + response["choices"][0]["message"]["content"] + "\n")

	if __name__ == '__main__':
	# chatText("what is AI?")
	# CreatDb()
	# QAQuery("what is COFOR ?")
	# CreatDb_P()
	# QAQuery_p("what is GST ?")
	if SysLock == "1":
	demo.queue().launch(auth=(username, password))
	else:
	demo.queue().launch()
	pass