Update app.py
app.py CHANGED
@@ -5,6 +5,22 @@ import threading
 import time
 from optimum.intel import OVModelForCausalLM, OVWeightQuantizationConfig
 import nncf
+from llama_index.core import SimpleDirectoryReader
+from rank_bm25 import BM25Okapi
+import jieba
+
+import subprocess
+import os
+os.makedirs("./data/", exist_ok=True)
+url = "https://www.cwa.gov.tw/V8/C/M/Fishery/tide_30day_MOD/T000311.html"
+output_dir = "./data/"
+cmd = ["wget", "-P", output_dir, url]
+
+try:
+    subprocess.run(cmd, check=True)
+    print("下載成功")
+except subprocess.CalledProcessError as e:
+    print("下載失敗:", e)

 import huggingface_hub as hf_hub
 # Initialize the OpenVINO model
@@ -20,8 +36,16 @@ config.top_k = 30;


 pipe = ov_genai.LLMPipeline(model_path, "CPU")
+pipe.get_tokenizer().set_chat_template(pipe.get_tokenizer().chat_template)
+
+# Load the documents (place them in the ./data folder; multiple files are supported)
+documents = SimpleDirectoryReader("./data").load_data()
+texts = [doc.get_content() for doc in documents]
+
+# Segment the text with jieba and build the BM25 index
+tokenized_corpus = [list(jieba.cut(text)) for text in texts]
+bm25 = BM25Okapi(tokenized_corpus)

-#pipe.start_chat()

 def start_chat():
     pipe.start_chat()
@@ -36,7 +60,26 @@ def finish_chat():
 # Inference function: use a streamer and return results as a generator
 def generate_stream(prompt):
     prompt = prompt #+ " /no_think" + " 答案短且明瞭"
-
+    tokenized_query = list(jieba.cut(prompt))
+
+    # Use BM25 to retrieve the top-k most relevant document passages
+    top_k = 1
+    doc_scores = bm25.get_scores(tokenized_query)
+    top_k_indices = sorted(range(len(doc_scores)), key=lambda i: doc_scores[i], reverse=True)[:top_k]
+
+    retrieved_texts = [texts[i] for i in top_k_indices]
+
+    print("=== 檢索到的相關段落 ===")
+    for i, txt in enumerate(retrieved_texts, 1):
+        print(f"--- 段落 {i} ---\n{txt}\n")
+
+    # Assemble the prompt from the retrieved passages only, instead of pasting the full text
+    context = "\n\n".join(retrieved_texts)
+    final_prompt = f"根據以下資訊,請簡潔回答問題:\n{context}\n\n問題:{prompt}\n回答:"
+
+    print("=== 最終 prompt ===")
+    print(final_prompt)
+
     q = queue.Queue()
     tps_result = ""
     def streamer(subword):
@@ -47,7 +90,7 @@ def generate_stream(prompt):
     def worker():
         # Run inference in a background thread
         nonlocal tps_result
-        gen_result = pipe.generate([
+        gen_result = pipe.generate([final_prompt], streamer=streamer, config=config)
         tps = gen_result.perf_metrics.get_throughput().mean
         tps_result = f"{tps:.2f} tokens/s"
         q.put(None)  # end-of-stream marker
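Note: the first hunk shells out to wget to fetch the CWA tide page. A minimal sketch of a standard-library alternative, in case the wget binary is not available in the runtime image (same URL and ./data/ target as above; the target file name is only an assumption matching what wget would pick):

import os
import urllib.request

url = "https://www.cwa.gov.tw/V8/C/M/Fishery/tide_30day_MOD/T000311.html"
output_dir = "./data/"
os.makedirs(output_dir, exist_ok=True)

# Save under the last path segment of the URL, mirroring wget's default naming.
target = os.path.join(output_dir, os.path.basename(url))
try:
    urllib.request.urlretrieve(url, target)
    print("Download succeeded:", target)
except OSError as e:  # urllib.error.URLError is a subclass of OSError
    print("Download failed:", e)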
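The retrieval added in the second and third hunks can be exercised in isolation. A minimal sketch, assuming rank_bm25 and jieba are installed; the two corpus strings below are invented stand-ins for the downloaded tide page, not data from the app:

import jieba
from rank_bm25 import BM25Okapi

# Invented stand-in corpus (the real app loads it via SimpleDirectoryReader("./data")).
texts = [
    "今日滿潮時間為上午六時,乾潮時間為中午十二時。",  # invented: tide times
    "明日天氣晴,氣溫攝氏二十八度。",                  # invented: weather
]

# Indexing step, as in the diff: segment with jieba, then build BM25.
tokenized_corpus = [list(jieba.cut(text)) for text in texts]
bm25 = BM25Okapi(tokenized_corpus)

# Query-time step, as in generate_stream.
prompt = "今天的滿潮時間是幾點?"  # invented query: "what time is high tide today?"
tokenized_query = list(jieba.cut(prompt))

top_k = 1
doc_scores = bm25.get_scores(tokenized_query)
top_k_indices = sorted(range(len(doc_scores)), key=lambda i: doc_scores[i], reverse=True)[:top_k]
retrieved_texts = [texts[i] for i in top_k_indices]

context = "\n\n".join(retrieved_texts)
final_prompt = f"根據以下資訊,請簡潔回答問題:\n{context}\n\n問題:{prompt}\n回答:"
print(final_prompt)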
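For context, generate_stream hands subwords from the background worker to the caller through a queue; only part of that plumbing is visible in the hunks above. A self-contained sketch of the producer/consumer pattern it relies on, with a dummy token source standing in for pipe.generate (all names here are illustrative, not the app's exact code):

import queue
import threading

def generate_stream_sketch(prompt):
    q = queue.Queue()

    def streamer(subword):
        # Called once per generated subword; forward it to the consumer side.
        q.put(subword)

    def worker():
        # Dummy producer standing in for pipe.generate(..., streamer=streamer, config=config).
        for token in ["Hello", ", ", "world"]:
            streamer(token)
        q.put(None)  # end-of-stream marker, as in the real app

    threading.Thread(target=worker, daemon=True).start()

    # Consumer: yield subwords as they arrive until the end marker appears.
    while True:
        item = q.get()
        if item is None:
            break
        yield item

print("".join(generate_stream_sketch("test")))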