Update app.py
Browse files
app.py
CHANGED
@@ -518,7 +518,7 @@ def extract_keywords_from_text(text, query_words):
|
|
518 |
return matched_lines
|
519 |
|
520 |
def clean_text(text):
|
521 |
-
return re.sub(r'[
|
522 |
|
523 |
|
524 |
from collections import Counter
|
@@ -571,7 +571,7 @@ def remove_stop_words_from_lines(lines, stop_words):
|
|
571 |
return cleaned_lines
|
572 |
|
573 |
if query:
|
574 |
-
closest_lines = find_closest_lines(query, doc_texts, stop_words, top_n=
|
575 |
|
576 |
# حذف استپورد و پاکسازی خطوط
|
577 |
cleaned_closest_lines = [
|
@@ -580,7 +580,7 @@ if query:
|
|
580 |
]
|
581 |
|
582 |
# خلاصهسازی
|
583 |
-
summarized_text = summarize_text_by_frequency("\n".join(cleaned_closest_lines), num_sentences=
|
584 |
|
585 |
if summarized_text.strip():
|
586 |
prompt = f"""
|
|
|
518 |
return matched_lines
|
519 |
|
520 |
def clean_text(text):
|
521 |
+
return re.sub(r'[^آ-ی۰-،.؟!؛+\-* ]+', '', text)
|
522 |
|
523 |
|
524 |
from collections import Counter
|
|
|
571 |
return cleaned_lines
|
572 |
|
573 |
if query:
|
574 |
+
closest_lines = find_closest_lines(query, doc_texts, stop_words, top_n=5)
|
575 |
|
576 |
# حذف استپورد و پاکسازی خطوط
|
577 |
cleaned_closest_lines = [
|
|
|
580 |
]
|
581 |
|
582 |
# خلاصهسازی
|
583 |
+
summarized_text = summarize_text_by_frequency("\n".join(cleaned_closest_lines), num_sentences=1)
|
584 |
|
585 |
if summarized_text.strip():
|
586 |
prompt = f"""
|