Spaces:

Vartex39
/

vizsum-pro

Running

Vartex39 committed 3 days ago

Commit

0303b9b

1 Parent(s): cc21f11

Claude 3 Haiku entegresi, tüm modüller güncellendi, prod-ready

Files changed (4) hide show

ocr_engine.py CHANGED Viewed

@@ -5,13 +5,20 @@ from dotenv import load_dotenv
 load_dotenv()
 ocr_api_key = os.getenv("OCR_SPACE_API_KEY")
-def extract_text_from_image(image_path):
     try:
-        if not isinstance(image_path, str) or not os.path.exists(image_path):
-            return "❌ Geçersiz dosya yolu."
-        with open(image_path, 'rb') as image_file:
-            image_data = image_file.read()
         response = requests.post(
             url='https://api.ocr.space/parse/image',
@@ -28,7 +35,7 @@ def extract_text_from_image(image_path):
         try:
             result = response.json()
         except Exception:
-            return f"❌ API yanıtı JSON formatında değil:\n{response.text}"
         if not isinstance(result, dict):
             return f"❌ API çıktısı sözlük değil:\n{result}"

 load_dotenv()
 ocr_api_key = os.getenv("OCR_SPACE_API_KEY")
+def extract_text_from_image(image_input):
     try:
+        if not ocr_api_key or not ocr_api_key.strip():
+            return "❌ OCR API anahtarı eksik."
+        # Hugging Face -> Gradio upload: image_input bir dosya yoludur (str)
+        # Local test: image_input file-like olabilir
+        if hasattr(image_input, "read"):
+            image_data = image_input.read()
+        elif isinstance(image_input, str) and os.path.exists(image_input):
+            with open(image_input, 'rb') as f:
+                image_data = f.read()
+        else:
+            return "❌ Geçersiz görsel girdisi."
         response = requests.post(
             url='https://api.ocr.space/parse/image',
         try:
             result = response.json()
         except Exception:
+            return f"❌ API yanıtı JSON değil:\n{response.text}"
         if not isinstance(result, dict):
             return f"❌ API çıktısı sözlük değil:\n{result}"

pdf_reader.py CHANGED Viewed

@@ -1,15 +1,29 @@
 import fitz  # PyMuPDF
 def extract_text_from_pdf(pdf_input):
     try:
-        if isinstance(pdf_input, str):
             doc = fitz.open(pdf_input)
         else:
-            doc = fitz.open(stream=pdf_input.read(), filetype="pdf")
-        text = "\n".join([page.get_text() for page in doc])
         doc.close()
         return text
     except Exception as e:
-        return f"❌ PDF İşleme Hatası: {str(e)}"

 import fitz  # PyMuPDF
+MAX_PAGES = 5  # fazla token yememesi için sınır
 def extract_text_from_pdf(pdf_input):
     try:
+        # Hugging Face ortamında pdf_input bir file-like objedir (upload edilen dosya)
+        if hasattr(pdf_input, "read"):
+            doc = fitz.open(stream=pdf_input.read(), filetype="pdf")
+        elif isinstance(pdf_input, str):
             doc = fitz.open(pdf_input)
         else:
+            return "[ERROR] Geçersiz PDF girişi"
+        total_pages = len(doc)
+        text = ""
+        for i in range(min(MAX_PAGES, total_pages)):
+            text += doc[i].get_text()
         doc.close()
+        if total_pages > MAX_PAGES:
+            text += f"\n\n[INFO] PDF {total_pages} sayfa. Yalnızca ilk {MAX_PAGES} sayfa işlendi."
         return text
     except Exception as e:
+        return f"[ERROR] PDF İşleme Hatası: {str(e)}"

summarizer.py CHANGED Viewed

@@ -3,8 +3,9 @@ import requests
 from dotenv import load_dotenv
 load_dotenv()
-api_key = os.getenv("OPENROUTER_API_KEY").strip()
 def build_prompt(text, mode):
     if "Sade" in mode:
@@ -23,17 +24,24 @@ def build_prompt(text, mode):
 def summarize_text(text, mode):
     url = "https://openrouter.ai/api/v1/chat/completions"
     headers = {
-        "Authorization": f"Bearer {api_key}",
         "Content-Type": "application/json"
     }
-    data = {
-        "model": "openai/gpt-3.5-turbo",
         "messages": [
             {"role": "user", "content": build_prompt(text, mode)}
         ]
     }
-    response = requests.post(url, headers=headers, json=data)
-    response.raise_for_status()
-    return response.json()['choices'][0]['message']['content']

 from dotenv import load_dotenv
 load_dotenv()
+api_key = os.getenv("OPENROUTER_API_KEY")
+if not api_key or not api_key.strip():
+    raise RuntimeError("❌ OPENROUTER_API_KEY bulunamadı. Hugging Face Secrets kısmına eklenmeli.")
 def build_prompt(text, mode):
     if "Sade" in mode:
 def summarize_text(text, mode):
     url = "https://openrouter.ai/api/v1/chat/completions"
     headers = {
+        "Authorization": f"Bearer {api_key.strip()}",
         "Content-Type": "application/json"
     }
+    payload = {
+        "model": "anthropic/claude-3-haiku",
         "messages": [
             {"role": "user", "content": build_prompt(text, mode)}
         ]
     }
+    try:
+        response = requests.post(url, headers=headers, json=payload)
+        response.raise_for_status()
+        result = response.json()
+        return result['choices'][0]['message']['content'].strip()
+    except requests.exceptions.HTTPError as e:
+        return f"❌ HTTP Hatası: {e} | Yanıt: {response.text}"
+    except Exception as e:
+        return f"❌ Sistemsel Hata: {str(e)}"

ui.py CHANGED Viewed

@@ -13,42 +13,39 @@ def process_input(pdf, image, manual_text, mode):
     else:
         return "Lütfen bir giriş türü seçin.", ""
     summary = summarize_text(text, mode)
     return text, summary
 with gr.Blocks() as demo:
-    gr.Markdown("## 📚 VizSum Pro+: AI Destekli Özetleyici")
     with gr.Row():
-        pdf_input = gr.File(label="📄 PDF Yükle", file_types=[".pdf"])
-        image_input = gr.Image(type="filepath", label="🖼️ Görsel Yükle")
-    manual_input = gr.Textbox(lines=5, label="✍️ Metni Manuel Gir")
-    # BURAYA AL
     mode_selector = gr.Dropdown(
-        choices=["📘 Teknik Özet", "🧒 Sade Anlatım", "🧠 Eleştir ve Değerlendir", "📝 Başlık Çıkar", "📎 Not Formatı"],
-        label="🧩 Özetleme Modu",
-        value="📘 Teknik Özet"
     )
     with gr.Row():
         submit_btn = gr.Button("Özetle")
     with gr.Row():
-        text_output = gr.Textbox(label="📜 Metin")
-        summary_output = gr.Textbox(label="🧠 AI Özeti")
-    # EN SONDA KALACAK
     submit_btn.click(
         fn=process_input,
         inputs=[pdf_input, image_input, manual_input, mode_selector],
         outputs=[text_output, summary_output]
     )
 if __name__ == "__main__":
-    demo.launch(share=True)

     else:
         return "Lütfen bir giriş türü seçin.", ""
+    if "[ERROR]" in text or "[INFO]" in text:
+        return text, ""
     summary = summarize_text(text, mode)
     return text, summary
 with gr.Blocks() as demo:
+    gr.Markdown("## VizSum Pro+: AI Destekli Özetleme Aracı")
     with gr.Row():
+        pdf_input = gr.File(label="PDF Yükle", file_types=[".pdf"])
+        image_input = gr.Image(type="filepath", label="Görsel Yükle")
+    manual_input = gr.Textbox(lines=5, label="Metni Manuel Gir")
     mode_selector = gr.Dropdown(
+        choices=["Teknik Özet", "Sade Anlatım", "Eleştir ve Değerlendir", "Başlık Çıkar", "Not Formatı"],
+        label="Özetleme Modu",
+        value="Teknik Özet"
     )
     with gr.Row():
         submit_btn = gr.Button("Özetle")
     with gr.Row():
+        text_output = gr.Textbox(label="Giriş Metni")
+        summary_output = gr.Textbox(label="AI Özeti")
     submit_btn.click(
         fn=process_input,
         inputs=[pdf_input, image_input, manual_input, mode_selector],
         outputs=[text_output, summary_output]
     )
 if __name__ == "__main__":
+    demo.launch(share=True)