Spaces:

k3ybladewielder
/

cloudwalk_chatbot

Sleeping

App Files Files Community

k3ybladewielder committed on Jul 15

Commit

1768992

verified ·

1 Parent(s): 7cb2abd

Update app.py

Browse files

Files changed (1) hide show

app.py +155 -60

app.py CHANGED Viewed

@@ -1,64 +1,159 @@
-import gradio as gr
-from huggingface_hub import InferenceClient
-"""
-For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
-"""
-client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
-def respond(
-    message,
-    history: list[tuple[str, str]],
-    system_message,
-    max_tokens,
-    temperature,
-    top_p,
-):
-    messages = [{"role": "system", "content": system_message}]
-    for val in history:
-        if val[0]:
-            messages.append({"role": "user", "content": val[0]})
-        if val[1]:
-            messages.append({"role": "assistant", "content": val[1]})
-    messages.append({"role": "user", "content": message})
-    response = ""
-    for message in client.chat_completion(
-        messages,
-        max_tokens=max_tokens,
-        stream=True,
-        temperature=temperature,
-        top_p=top_p,
-    ):
-        token = message.choices[0].delta.content
-        response += token
-        yield response
-"""
-For information on how to customize the ChatInterface, peruse the gradio docs: https://www.gradio.app/docs/chatinterface
-"""
-demo = gr.ChatInterface(
-    respond,
-    additional_inputs=[
-        gr.Textbox(value="You are a friendly Chatbot.", label="System message"),
-        gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max new tokens"),
-        gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
-        gr.Slider(
-            minimum=0.1,
-            maximum=1.0,
-            value=0.95,
-            step=0.05,
-            label="Top-p (nucleus sampling)",
-        ),
-    ],
 )
 if __name__ == "__main__":
-    demo.launch()

+import os
+import yaml
+import gradio as gr # Importe o Gradio
+from langchain_huggingface import ChatHuggingFace
+from langchain_huggingface.llms.huggingface_endpoint import HuggingFaceEndpoint
+from langchain_community.vectorstores import FAISS
+from langchain.chains import RetrievalQA
+from langchain_huggingface.embeddings import HuggingFaceEmbeddings
+from langchain.prompts import PromptTemplate
+# --- MODEL CONFIGURATION ---
+# Alternative model id: LLM_MODEL = 'google/gemma-3-4b-it'
+LLM_MODEL = 'google/gemma-3-1b-it'
+EMBEDDING_MODEL = "sentence-transformers/all-MiniLM-L6-v2"
+# --- CONFIGURAÇÃO DO TOKEN HF ---
+try:
+    with open("../config.yaml", "r") as file:
+        config = yaml.safe_load(file)
+    HF_TOKEN = config.get('HF_TOKEN')
+except FileNotFoundError:
+    print("Arquivo config.yaml não encontrado. Certifique-se de que ele existe e está no diretório correto.")
+    HF_TOKEN = None
+if not HF_TOKEN:
+    print("Token HF não encontrado no config.yaml ou arquivo não existe.")
+    if "HF_TOKEN" not in os.environ:
+        import getpass
+        os.environ["HF_TOKEN"] = getpass.getpass("Por favor, digite seu token da API Hugging Face: ")
+    HF_TOKEN = os.environ["HF_TOKEN"]
+# --- 1. Initialize the Hugging Face LLM endpoint ---
+llm = HuggingFaceEndpoint(
+    repo_id=LLM_MODEL,
+    task="text-generation",
+    max_new_tokens=1024,
+    do_sample=False,
+    repetition_penalty=1.03,
+    huggingfacehub_api_token=HF_TOKEN,
 )
+# Chat wrapper around the endpoint; this is the object handed to the QA chain.
+chat_model = ChatHuggingFace(llm=llm)
+# --- 2. Initialize the embeddings ---
+# NOTE(review): presumably this must be the same embedding model that was
+# used to build the saved FAISS index - confirm.
+embeddings = HuggingFaceEmbeddings(model_name=EMBEDDING_MODEL)
+# --- 3. Carregando a vector store FAISS salva localmente ---
+vector_store_path = '../vector_store/vs_base/'
+try:
+    faiss_store = FAISS.load_local(vector_store_path, embeddings, allow_dangerous_deserialization=True)
+except Exception as e:
+    print(f"Erro ao carregar a vector store FAISS: {e}")
+    print("Verifique se o caminho está correto e se o arquivo não está corrompido.")
+    exit()
+# --- 4. Retriever a partir da vector store (usando similarity como exemplo) ---
+retriever = faiss_store.as_retriever(search_type="similarity", search_kwargs={"k": 10})
+retriever = faiss_store.as_retriever(
+    search_type="mmr",
+    search_kwargs={"k": 5, "fetch_k": 20, "lambda_mult": 0.7}
+)
+# --- 5. PromptTemplate personalizado ---
+custom_prompt_template = """
+You are a useful chatbot for customer service.
+If you don't know the answer, just say that you don't know, don't try to make up an answer.
+ALWAYS RESPONDE IN THE SAME LANGUAGE AS THE INPUT.
+Use the following pieces of context to answer the user's question.
+{context}
+Question: {question}
+Helpful Answer:"""
+# Crie um objeto PromptTemplate a partir da string
+QA_CHAIN_PROMPT = PromptTemplate.from_template(custom_prompt_template)
+# --- 6. Cria uma cadeia de QA que usa o retriever e o modelo ---
+qa_chain = RetrievalQA.from_chain_type(
+    llm=chat_model,
+    chain_type="stuff",
+    retriever=retriever,
+    return_source_documents=True,
+    chain_type_kwargs={"prompt": QA_CHAIN_PROMPT}
+)
+# --- 7. Função principal para a interface do Gradio ---
+# Esta função será chamada pelo Gradio para gerar a resposta.
+# Ela precisa retornar a resposta do chatbot como uma string.
+def chat_response(question: str, history: list): # `history` é um parâmetro obrigatório para gr.ChatInterface
+    """
+    Gera a resposta do chatbot usando o modelo de QA e formata para exibição no Gradio.
+    Args:
+        question (str): A pergunta do usuário.
+        history (list): Histórico de conversas (não usado diretamente aqui, mas necessário para a interface).
+    Returns:
+        str: A resposta formatada do chatbot, incluindo as fontes.
+    """
+    print(f"Recebida pergunta: '{question}'") # Para debug no console
+    try:
+        result = qa_chain.invoke({"query": question})
+        answer = result["result"]
+        sources = result.get("source_documents", [])
+        response_text = f"**Resposta:** {answer}\n\n"
+        if sources:
+            response_text += "**Saiba mais em:**\n"
+            unique_sources = set()
+            source_list_for_printing = []
+            for doc in sources:
+                source_name = doc.metadata.get('source', 'Fonte desconhecida')
+                if source_name not in unique_sources:
+                    unique_sources.add(source_name)
+                    source_list_for_printing.append(source_name)
+            for i, source_name in enumerate(source_list_for_printing):
+                response_text += f"- {i+1}. '{source_name}'\n"
+        else:
+            response_text += "Nenhuma fonte específica foi utilizada para esta resposta.\n"
+        return response_text
+    except Exception as e:
+        error_message = f"Ocorreu um erro ao processar sua pergunta: {e}. Por favor, tente novamente."
+        print(error_message) # Para debug no console
+        return error_message
+# --- 8. Criação da Interface Gradio ---
 if __name__ == "__main__":
+    print("Iniciando a interface Gradio...")
+    # gr.ChatInterface é ideal para interfaces de chatbot
+    demo = gr.ChatInterface(
+        type="messages",
+        fn=chat_response, # A função que processa a pergunta e retorna a resposta
+        title="CloudWalk Chatbot",
+        description="Olá! Estou aqui para responder suas dúvidas.",
+        submit_btn="Enviar Pergunta",
+        examples=[
+            ["What product and services InfinitePay offer ?"],
+            ['What are the fees for the card machine?'],
+            ['How can I order one card machine?'],
+            ["Quais serviços a infinite pay oferece?"],
+            ["Quais as taxas da maquininha?"],
+            ["Como pedir uma maquininha?"],
+        ],
+        chatbot=gr.Chatbot(type="messages")
+    )
+    # Inicia a interface Gradio
+    # `share=True` gera um link público temporário (útil para testes ou demonstrações)
+    # `debug=True` mostra logs detalhados no terminal
+    demo.launch(share=True)