Spaces:

sibthinon
/

environment

Running

App Files Files Community

sibthinon committed on May 22

Commit

49c543f

verified ·

1 Parent(s): 1b71a8f

add fuzzy

Browse files

Files changed (1) hide show

app.py +35 -18

app.py CHANGED Viewed

@@ -6,11 +6,14 @@ from sentence_transformers import SentenceTransformer
 from qdrant_client import QdrantClient
 from qdrant_client.models import Filter, FieldCondition, MatchValue
 import os
 qdrant_client = QdrantClient(
-    url=os.environ.get("Qdrant_url"),
-    api_key=os.environ.get("Qdrant_api"),
 )
 # โมเดลที่โหลดล่วงหน้า
@@ -39,6 +42,16 @@ model_config = {
 # Global memory to hold feedback state
 latest_query_result = {"query": "", "result": "", "model": ""}
 # 🌟 Main search function
 def search_product(query, model_name):
     start_time = time.time()
@@ -46,35 +59,39 @@ def search_product(query, model_name):
     if model_name not in model_config:
         return "❌ ไม่พบโมเดล"
-    query_embed = model_config[model_name]["func"](query)
     collection_name = model_config[model_name]["collection"]
-    # Query Qdrant
     try:
-      result = qdrant_client.query_points(
-          collection_name=collection_name,
-          query=query_embed.tolist(),
-          with_payload=True,
-          query_filter=Filter(
-              must=[FieldCondition(key="type", match=MatchValue(value="product"))]
-          )
-      ).points
     except Exception as e:
-      return f"❌ Qdrant error: {str(e)}"
     elapsed = time.time() - start_time
-    # Format result
-    output = f"⏱ Time: {elapsed:.2f}s\n\n📦 ผลลัพธ์:\n"
     result_summary = ""
     for res in result:
         line = f"- {res.payload.get('name', '')} (score: {res.score:.4f})"
         output += line + "\n"
         result_summary += line + " | "
-    # Save latest query
-    latest_query_result["query"] = query
     latest_query_result["result"] = result_summary.strip()
     latest_query_result["model"] = model_name

 from qdrant_client import QdrantClient
 from qdrant_client.models import Filter, FieldCondition, MatchValue
 import os
+from symspellpy.symspellpy import SymSpell, Verbosity
 qdrant_client = QdrantClient(  # module-level Qdrant client, configured from the "Qdrant_url" / "Qdrant_api" entries
+    #url=os.environ.get("Qdrant_url"),
+    #api_key=os.environ.get("Qdrant_api"),
+    url=userdata.get("Qdrant_url"),  # NOTE(review): `userdata` is not imported in the visible part of the file — confirm it is defined in this runtime
+    api_key=userdata.get("Qdrant_api"),
 )
 # โมเดลที่โหลดล่วงหน้า
 # Global memory to hold feedback state
 latest_query_result = {"query": "", "result": "", "model": ""}
+symspell = SymSpell(max_dictionary_edit_distance=2)  # module-level spell-correction index; dictionary precomputed for edit distance <= 2
+symspell.load_dictionary("symspell_dict_pythainlp.txt", term_index=0, count_index=1)  # term in column 0, count in column 1; NOTE(review): return value is not checked — confirm the file ships with the app
+# แก้คำผิด
+def correct_query_with_symspell(query: str) -> str:
+    suggestions = symspell.lookup_compound(query, Verbosity.CLOSEST, max_edit_distance=2)
+    if suggestions:
+        return suggestions[0].term
+    return query
 # 🌟 Main search function
 def search_product(query, model_name):
     start_time = time.time()
     if model_name not in model_config:
         return "❌ ไม่พบโมเดล"
+    # ✨ แทรกขั้นตอน fuzzy correction
+    corrected_query = correct_query_with_symspell(query)
+    query_embed = model_config[model_name]["func"](corrected_query)
     collection_name = model_config[model_name]["collection"]
     try:
+        result = qdrant_client.query_points(
+            collection_name=collection_name,
+            query=query_embed.tolist(),
+            with_payload=True,
+            query_filter=Filter(
+                must=[FieldCondition(key="type", match=MatchValue(value="product"))]
+            ),
+            limit=10
+        ).points
     except Exception as e:
+        return f"❌ Qdrant error: {str(e)}"
     elapsed = time.time() - start_time
+    output = f"⏱ Time: {elapsed:.2f}s\n"
+    if corrected_query != query:
+        output += f"🔧 แก้คำค้นจาก: `{query}` → `{corrected_query}`\n\n"
+    output += f"📦 ผลลัพธ์:\n"
     result_summary = ""
     for res in result:
         line = f"- {res.payload.get('name', '')} (score: {res.score:.4f})"
         output += line + "\n"
         result_summary += line + " | "
+    latest_query_result["query"] = corrected_query
     latest_query_result["result"] = result_summary.strip()
     latest_query_result["model"] = model_name