Fix: info block is now shown only for PDF summaries; token limit lowered to 1000
Files changed:
- summarizer.py: +1 -1
- ui.py: +20 -11
summarizer.py CHANGED
@@ -68,7 +68,7 @@ def summarize_text(text, mode, model_name="anthropic/claude-3-haiku", lang_mode=
         "messages": [
             {"role": "user", "content": build_prompt(text, mode, lang_mode, is_table)}
         ],
-        "max_tokens":
+        "max_tokens": 1000
     }
 
     try:
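For context, a minimal sketch of the kind of request body this hunk edits, assuming summarize_text posts an OpenAI-style chat payload to OpenRouter. The model name "anthropic/claude-3-haiku" comes from the diff; the endpoint URL, payload variable, and response handling below are assumptions for illustration, not code from the repo.

import requests

def summarize_text_sketch(text, api_key, model_name="anthropic/claude-3-haiku"):
    # Hypothetical reconstruction of the request around the changed line.
    # "max_tokens" caps the length of the model's reply; this commit sets it to 1000.
    payload = {
        "model": model_name,
        "messages": [
            {"role": "user", "content": text}
        ],
        "max_tokens": 1000,
    }
    resp = requests.post(
        "https://openrouter.ai/api/v1/chat/completions",  # assumed endpoint
        headers={"Authorization": f"Bearer {api_key}"},
        json=payload,
        timeout=60,
    )
    resp.raise_for_status()
    return resp.json()["choices"][0]["message"]["content"]

A lower max_tokens shortens each per-chunk summary and reduces cost, and it pairs with the 1000-token chunking change in ui.py below.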
ui.py CHANGED
@@ -7,33 +7,41 @@ from utils import chunk_text_by_tokens
 
 def process_input(pdf, image, manual_text, mode, model_name, start_page, end_page, lang_mode, is_table):
     if is_table and model_name != "anthropic/claude-3-haiku":
-        return "Tablo içeriği için yalnızca Claude önerilir.","",None
+        return "Tablo içeriği için yalnızca Claude önerilir.", "", None
 
+    info_block = ""
+
     if pdf is not None:
         text_chunks = extract_text_chunks_from_pdf(pdf, start=int(start_page), end=int(end_page))
         if any("[ERROR]" in chunk for chunk in text_chunks):
             return text_chunks[0], "", None
+
+        all_text = "\n\n".join(text_chunks)
+        chunk_count = len(chunk_text_by_tokens(all_text, max_tokens=1000))
+        info_block = f"""
+        Sayfa Aralığı: {start_page}–{end_page}
+        Model: {model_name}
+        Chunk Sayısı: {chunk_count}
+        """.strip()
+
     elif image is not None:
         text = extract_text_from_image(image)
         if "[ERROR]" in text:
             return text, "", None
         text_chunks = [text]
+        all_text = text
+
     elif manual_text.strip() != "":
         text_chunks = [manual_text]
+        all_text = manual_text
+
     else:
         return "Lütfen bir giriş türü seçin.", "", None
 
-    all_text = "\n\n".join(text_chunks)
-    chunk_count = len(chunk_text_by_tokens(all_text, max_tokens=1300))
-
-    info_block = f"""
-    Sayfa Aralığı: {start_page}–{end_page}
-    Model: {model_name}
-    Chunk Sayısı: {chunk_count}
-    """.strip()
-
     full_summary = summarize_long_text(all_text, mode, model_name, lang_mode, is_table)
-
+
+    if info_block:
+        full_summary = f"{info_block}\n\n{full_summary}"
 
     temp_file = tempfile.NamedTemporaryFile(delete=False, suffix=".txt", mode='w', encoding='utf-8')
     temp_file.write(full_summary)
@@ -42,6 +50,7 @@ def process_input(pdf, image, manual_text, mode, model_name, start_page, end_pag
     return all_text, full_summary, temp_file.name
 
 
+
 with gr.Blocks() as demo:
     gr.Markdown("## VizSum")
 
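To make the behavioral change concrete, here is a small self-contained sketch of the new control flow: the info block is built only in the PDF branch and prepended only when it is non-empty, so image and manual-text summaries come back without the header. chunk_text_by_tokens is stubbed with a whitespace splitter purely for illustration; the real helper lives in utils.py and its tokenization will differ.

def chunk_text_by_tokens_stub(text, max_tokens=1000):
    # Illustrative stand-in for utils.chunk_text_by_tokens:
    # group whitespace-separated words into max_tokens-sized chunks.
    words = text.split()
    return [" ".join(words[i:i + max_tokens])
            for i in range(0, len(words), max_tokens)] or [""]

def build_info_block(all_text, start_page, end_page, model_name, is_pdf):
    # Mirrors the new ui.py logic: only PDF input produces an info block.
    if not is_pdf:
        return ""
    chunk_count = len(chunk_text_by_tokens_stub(all_text, max_tokens=1000))
    return "\n".join([
        f"Sayfa Aralığı: {start_page}–{end_page}",
        f"Model: {model_name}",
        f"Chunk Sayısı: {chunk_count}",
    ])

summary = "Özet metni..."

# PDF input: the header is prepended (2500 words -> 3 chunks of up to 1000).
info = build_info_block("kelime " * 2500, 1, 5, "anthropic/claude-3-haiku", is_pdf=True)
print(f"{info}\n\n{summary}" if info else summary)

# Image or manual-text input: info stays empty, so the summary is printed unchanged.
info = build_info_block("kısa bir metin", 1, 1, "anthropic/claude-3-haiku", is_pdf=False)
print(f"{info}\n\n{summary}" if info else summary)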