Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -1,23 +1,29 @@
|
|
|
|
|
|
1 |
import os
|
|
|
2 |
import json
|
|
|
3 |
import gradio as gr
|
4 |
import openai
|
5 |
from sentence_transformers import SentenceTransformer
|
6 |
from pinecone import Pinecone, ServerlessSpec
|
7 |
|
|
|
8 |
openai.api_key = os.getenv("openai")
|
|
|
|
|
|
|
9 |
|
|
|
10 |
model = SentenceTransformer('paraphrase-multilingual-MiniLM-L12-v2')
|
11 |
|
|
|
12 |
with open("tiyam_qa_data.json", "r", encoding="utf-8") as f:
|
13 |
data = json.load(f)
|
14 |
|
15 |
-
|
16 |
-
region = os.getenv("PINECONE_ENVIRONMENT", "us-west1-gcp")
|
17 |
-
index_name = os.getenv("PINECONE_INDEX_NAME", "tiyam-chat")
|
18 |
-
|
19 |
pc = Pinecone(api_key=api_key)
|
20 |
-
|
21 |
existing_indexes = pc.list_indexes().names()
|
22 |
if index_name not in existing_indexes:
|
23 |
pc.create_index(
|
@@ -29,25 +35,29 @@ if index_name not in existing_indexes:
|
|
29 |
region=region
|
30 |
)
|
31 |
)
|
32 |
-
|
33 |
index = pc.Index(index_name)
|
34 |
|
35 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
36 |
query_embedding = model.encode([query])[0]
|
37 |
result = index.query(vector=query_embedding.tolist(), top_k=top_k, include_metadata=True)
|
38 |
-
|
39 |
try:
|
40 |
result_dict = result.to_dict()
|
41 |
except Exception:
|
42 |
result_dict = str(result)
|
43 |
-
|
44 |
print("=== Pinecone query result ===")
|
45 |
if isinstance(result_dict, dict):
|
46 |
print(json.dumps(result_dict, indent=2, ensure_ascii=False))
|
47 |
else:
|
48 |
print(result_dict)
|
49 |
print("============================")
|
50 |
-
|
51 |
if hasattr(result, 'matches') and result.matches and len(result.matches) > 0 and result.matches[0].score > threshold:
|
52 |
metadata = result.matches[0].metadata
|
53 |
print("Matched answer:", metadata.get('answer'))
|
@@ -59,23 +69,27 @@ def retrieve_answer(query, threshold=0.4, top_k=1): # <-- کاهش threshold ب
|
|
59 |
def generate_human_response(context_text):
|
60 |
if not context_text:
|
61 |
return "متأسفم، پاسخ دقیقی برای این سوال نداریم. لطفاً با ما تماس بگیرید."
|
62 |
-
|
|
|
63 |
prompt = (
|
64 |
f"این متن پاسخ سوال مشتری است: \"{context_text}\".\n"
|
65 |
-
"لطفاً یک پاسخ کوتاه، رسمی و کاملاً مختصر و مفید به زبان فارسی تولید کن که فقط بر اساس همین متن
|
66 |
)
|
67 |
-
|
68 |
try:
|
69 |
response = openai.chat.completions.create(
|
70 |
-
model="gpt-
|
71 |
messages=[
|
72 |
{"role": "system", "content": "شما یک پاسخگوی رسمی شرکت هستید."},
|
73 |
{"role": "user", "content": prompt}
|
74 |
],
|
75 |
temperature=0.2,
|
76 |
-
max_tokens=
|
77 |
)
|
78 |
-
|
|
|
|
|
|
|
|
|
79 |
except Exception as e:
|
80 |
print("OpenAI API error:", e)
|
81 |
return "خطا در پردازش درخواست."
|
@@ -94,4 +108,4 @@ demo = gr.Interface(
|
|
94 |
)
|
95 |
|
96 |
if __name__ == "__main__":
|
97 |
-
demo.launch()
|
|
|
1 |
+
import pandas as pd
|
2 |
+
import numpy as np
|
3 |
import os
|
4 |
+
import sys
|
5 |
import json
|
6 |
+
import pickle
|
7 |
import gradio as gr
|
8 |
import openai
|
9 |
from sentence_transformers import SentenceTransformer
|
10 |
from pinecone import Pinecone, ServerlessSpec
|
11 |
|
12 |
+
# API key configuration (original Persian comment: "تنظیم کلیدهای API").
# NOTE(review): the OpenAI key is read from an env var/secret literally named
# "openai" — confirm that is really the secret's name in this Space.
openai.api_key = os.getenv("openai")
# Pinecone settings; environment and index name fall back to defaults.
api_key = os.getenv("PINECONE_API_KEY")
region = os.getenv("PINECONE_ENVIRONMENT", "us-west1-gcp")
index_name = os.getenv("PINECONE_INDEX_NAME", "tiyam-chat")
|
17 |
|
18 |
+
# Load the multilingual sentence-embedding model used to embed queries
# (original Persian comment: "بارگذاری مدل").
model = SentenceTransformer('paraphrase-multilingual-MiniLM-L12-v2')

# Load the Q&A data. Per the original note ("در حال حاضر فقط لود میشه،
# باید به Pinecone اضافه بشه") it is only loaded here and still needs to
# be upserted into Pinecone.
with open("tiyam_qa_data.json", "r", encoding="utf-8") as f:
    data = json.load(f)
|
24 |
|
25 |
+
# Connect to Pinecone (original Persian comment: "اتصال به Pinecone").
pc = Pinecone(api_key=api_key)
# Names of all indexes in this project, used below to create the index
# only if it does not already exist.
existing_indexes = pc.list_indexes().names()
|
28 |
if index_name not in existing_indexes:
|
29 |
pc.create_index(
|
|
|
35 |
region=region
|
36 |
)
|
37 |
)
|
|
|
38 |
index = pc.Index(index_name)
|
39 |
|
40 |
+
# On-disk cache of generated responses (original Persian comment: "سیستم کش").
# NOTE: pickle is only acceptable here because the file is written solely by
# this app itself; never load a pickle from an untrusted source.
cache_file = "chat_cache.pkl"
try:
    with open(cache_file, "rb") as f:
        cache = pickle.load(f)
except (FileNotFoundError, EOFError, pickle.UnpicklingError):
    # A missing, empty, or corrupted cache file must not crash startup —
    # start with an empty cache. (The original caught only FileNotFoundError,
    # so a truncated/corrupt file raised at import time.)
    cache = {}
|
47 |
+
|
48 |
+
def retrieve_answer(query, threshold=0.6, top_k=1): # افزایش threshold به 0.6
|
49 |
query_embedding = model.encode([query])[0]
|
50 |
result = index.query(vector=query_embedding.tolist(), top_k=top_k, include_metadata=True)
|
|
|
51 |
try:
|
52 |
result_dict = result.to_dict()
|
53 |
except Exception:
|
54 |
result_dict = str(result)
|
|
|
55 |
print("=== Pinecone query result ===")
|
56 |
if isinstance(result_dict, dict):
|
57 |
print(json.dumps(result_dict, indent=2, ensure_ascii=False))
|
58 |
else:
|
59 |
print(result_dict)
|
60 |
print("============================")
|
|
|
61 |
if hasattr(result, 'matches') and result.matches and len(result.matches) > 0 and result.matches[0].score > threshold:
|
62 |
metadata = result.matches[0].metadata
|
63 |
print("Matched answer:", metadata.get('answer'))
|
|
|
69 |
def generate_human_response(context_text):
    """Turn a retrieved answer snippet into a short, formal Persian reply.

    Returns a canned Persian apology when *context_text* is empty/None,
    a cached reply when this exact context was answered before, otherwise
    a freshly generated reply (which is then cached to disk best-effort).
    On OpenAI failure a generic Persian error message is returned.
    """
    if not context_text:
        return "متأسفم، پاسخ دقیقی برای این سوال نداریم. لطفاً با ما تماس بگیرید."
    # Serve repeated contexts from the cache to save API calls.
    if context_text in cache:
        return cache[context_text]
    prompt = (
        f"این متن پاسخ سوال مشتری است: \"{context_text}\".\n"
        "لطفاً یک پاسخ کوتاه، رسمی و کاملاً مختصر و مفید به زبان فارسی تولید کن که فقط بر اساس همین متن باشد."
    )
    try:
        response = openai.chat.completions.create(
            model="gpt-3.5-turbo",  # cheaper model (original comment: "مدل ارزان‌تر")
            messages=[
                {"role": "system", "content": "شما یک پاسخگوی رسمی شرکت هستید."},
                {"role": "user", "content": prompt}
            ],
            temperature=0.2,
            max_tokens=50,  # keep replies short (original comment: "کاهش توکن‌ها")
        )
        answer = response.choices[0].message.content.strip()
    except Exception as e:
        print("OpenAI API error:", e)
        return "خطا در پردازش درخواست."
    # Persist the cache OUTSIDE the OpenAI try-block and best-effort: in the
    # original, a disk error during pickle.dump discarded the already-generated
    # answer and was mislabeled as an OpenAI API error. A failed cache write
    # should not turn a successful generation into an error response.
    cache[context_text] = answer
    try:
        with open(cache_file, "wb") as f:
            pickle.dump(cache, f)
    except OSError as e:
        print("Cache write error:", e)
    return answer
|
|
|
108 |
)
|
109 |
|
110 |
if __name__ == "__main__":
    # Launch the Gradio UI only when run as a script (not on import).
    demo.launch()
|