Spaces:

bvd757
/

checked

Sleeping

App Files Files Community

bvd757 committed on May 10

Commit

aff21a4

1 Parent(s): 407e6f0

no false errors

Browse files

Files changed (1) hide show

search_errors_logic.py +32 -3

search_errors_logic.py CHANGED Viewed

@@ -2,6 +2,28 @@ import openai
 from openai import OpenAI
 import difflib
 prompt_fix_text_gpt = """
 Исправь ошибки в данном тексте. Текст в makrdown и должен в результате остаться в markdown.
 Жаргонизмы считаются ошибками, приемлим только официальный стиль.
@@ -127,7 +149,7 @@ def get_gpt_response_vsegpt(inp):
     return response
-def get_gpt_response(inp, client_name):
     if client_name == "openai":
         return get_gpt_response_openai(inp)
     elif client_name == "vsegpt":
@@ -223,6 +245,10 @@ def check_text_chat_gpt(text, fixed_text=None, add_errors=False, *args, **kwargs
 def check_text_chat_gpt_highlight_mode(text, fixed_text=None, add_errors=False, *args, **kwargs):
     if fixed_text is None:
         fixed_text = get_gpt_response(prompt_fix_text_gpt.format(text), "vsegpt")
     changes = find_corrected_positions(text, fixed_text)
     bounds_init = []
     for change in changes:
@@ -244,8 +270,11 @@ def check_text_chat_gpt_highlight_mode(text, fixed_text=None, add_errors=False,
     errors = []
     for bound in bounds_result:
-        inp = prompt_compare_get_comment.format(text[bound["start_orig"]:bound["end_orig"]],
-                                                fixed_text[bound["start_corr"]:bound["end_corr"]])
         errors.append({
             'start': bound["start_orig"],
             'end': bound["end_orig"],

 from openai import OpenAI
 import difflib
# Prompt template for the "is this difference really an error?" check.
# It is filled in with str.format() using two positional arguments, so the
# literal braces of the JSON example must be doubled ({{ and }}); left single,
# format() parses them as a replacement field and raises KeyError.
# The ```json fence is also closed so the example is well-formed markdown.
prompt_is_there_error = """Ты — лингвистический анализатор. Тебе будут даны две текстовые строки:
1. Оригинальный текст (точно без ошибок)
2. Текст для проверки (может содержать ошибку или альтернативное написание)
Задача:
- Сравни второй текст с оригиналом на предмет наличия ошибок (орфографических, пунктуационных, грамматических)
- Если во втором тексте есть ошибка (отличается от оригинала и это не допустимый вариант написания) — верни 1
- Если текст совпадает с оригиналом или отличается только допустимыми вариантами написания (синонимы, альтернативная пунктуация и т.п.) — верни 0
Формат ответа — строго JSON:
```json
{{
  "result": 0|1
}}
```
Оригинальный текст:
{}
Текст для проверки:
{}
"""
 prompt_fix_text_gpt = """
 Исправь ошибки в данном тексте. Текст в makrdown и должен в результате остаться в markdown.
 Жаргонизмы считаются ошибками, приемлим только официальный стиль.
     return response
+def get_gpt_response(inp, client_name="vsegpt"):
     if client_name == "openai":
         return get_gpt_response_openai(inp)
     elif client_name == "vsegpt":
 def check_text_chat_gpt_highlight_mode(text, fixed_text=None, add_errors=False, *args, **kwargs):
     if fixed_text is None:
         fixed_text = get_gpt_response(prompt_fix_text_gpt.format(text), "vsegpt")
+    text = text.replace("ё", "е")
+    fixed_text = fixed_text.replace("ё", "е")
     changes = find_corrected_positions(text, fixed_text)
     bounds_init = []
     for change in changes:
     errors = []
     for bound in bounds_result:
+        orig_piece = text[bound["start_orig"]:bound["end_orig"]]
+        fixed_piece = fixed_text[bound["start_corr"]:bound["end_corr"]]
+        if "0" in get_gpt_response(prompt_is_there_error.format(orig_piece, fixed_piece)):
+            continue
+        inp = prompt_compare_get_comment.format(orig_piece, fixed_piece)
         errors.append({
             'start': bound["start_orig"],
             'end': bound["end_orig"],