Spaces:

3a05chatgpt
/

pdf-summarizer-app

Sleeping

App Files Files Community

3a05chatgpt commited on 22 days ago

Commit

a3f064a

verified ·

1 Parent(s): ca9cc44

Update app.py

Browse files

Files changed (1) hide show

app.py +209 -49

app.py CHANGED Viewed

@@ -1,6 +1,6 @@
 import openai
 import gradio as gr
-import fitz
 from openai import OpenAI
 import traceback
@@ -12,121 +12,281 @@ client = None
 pdf_text = ""
 def set_api_key(user_api_key):
     global api_key, client
     try:
         api_key = user_api_key.strip()
         if not api_key:
             return "❌ API Key 不能為空"
         client = OpenAI(api_key=api_key)
-        client.chat.completions.create(
-            model="gpt-4",
-            messages=[{"role": "user", "content": "你好"}],
-            max_tokens=5
-        )
-        return "✅ API Key 已設定並驗證成功"
     except Exception as e:
-        return f"❌ API Key 設定失敗: {str(e)}"
 def set_model(model_name):
     global selected_model
-    selected_model = model_name
-    return f"✅ 模型已選擇：{model_name}"
 def extract_pdf_text(file_path):
     try:
         doc = fitz.open(file_path)
         text = ""
         for page_num, page in enumerate(doc):
             page_text = page.get_text()
             if page_text.strip():
-                text += f"\n--- 第 {page_num + 1} 頁 ---\n{page_text}"
         doc.close()
         return text
     except Exception as e:
         return f"❌ PDF 解析錯誤: {str(e)}"
 def generate_summary(pdf_file):
     global summary_text, pdf_text
     if not client:
-        return "❌ 請先設定 API Key"
     if not pdf_file:
         return "❌ 請先上傳 PDF 文件"
     try:
         pdf_text = extract_pdf_text(pdf_file.name)
         if not pdf_text.strip():
-            return "⚠️ 無法解析 PDF 文字"
-        pdf_text_truncated = pdf_text[:8000]
         response = client.chat.completions.create(
             model=selected_model,
             messages=[
-                {"role": "system", "content": "請用繁體中文整理以下 PDF 內容摘要。"},
                 {"role": "user", "content": pdf_text_truncated}
             ],
             temperature=0.3
         )
         summary_text = response.choices[0].message.content
         return summary_text
     except Exception as e:
-        print(traceback.format_exc())
-        return f"❌ 摘要生成失敗: {str(e)}"
 def ask_question(user_question):
     if not client:
-        return "❌ 請先設定 API Key"
     if not summary_text and not pdf_text:
         return "❌ 請先生成 PDF 摘要"
     if not user_question.strip():
         return "❌ 請輸入問題"
     try:
         context = f"PDF 摘要:\n{summary_text}\n\n原始���容（部分）:\n{pdf_text[:2000]}"
         response = client.chat.completions.create(
             model=selected_model,
             messages=[
-                {"role": "system", "content": f"根據以下 PDF 內容回答問題，用繁體中文：\n{context}"},
                 {"role": "user", "content": user_question}
             ],
             temperature=0.2
         )
         return response.choices[0].message.content
     except Exception as e:
-        print(traceback.format_exc())
-        return f"❌ 問答生成失敗: {str(e)}"
 def clear_all():
     global summary_text, pdf_text
     summary_text = ""
     pdf_text = ""
     return "", "", ""
-with gr.Blocks(title="PDF 摘要助手") as demo:
-    gr.Markdown("## 📄 PDF 摘要 & 問答助手")
     with gr.Tab("🔧 設定"):
-        api_key_input = gr.Textbox(label="輸入 OpenAI API Key", type="password")
-        api_key_status = gr.Textbox(label="API 狀態", interactive=False)
-        api_key_btn = gr.Button("確認 API Key")
-        api_key_btn.click(set_api_key, inputs=api_key_input, outputs=api_key_status)
-        model_choice = gr.Radio(["gpt-4", "gpt-4.1", "gpt-4.5"], label="選擇 AI 模型", value="gpt-4")
-        model_status = gr.Textbox(label="模型狀態", interactive=False, value="✅ 已選擇：gpt-4")
-        model_choice.change(set_model, inputs=model_choice, outputs=model_status)
-    with gr.Tab("📄 摘要"):
-        pdf_upload = gr.File(label="上傳 PDF", file_types=[".pdf"])
-        summary_btn = gr.Button("生成摘要")
-        summary_output = gr.Textbox(label="PDF 摘要", lines=10)
-        summary_btn.click(generate_summary, inputs=pdf_upload, outputs=summary_output)
     with gr.Tab("❓ 問答"):
-        question_input = gr.Textbox(label="請輸入問題", lines=2)
-        question_btn = gr.Button("送出問題")
-        answer_output = gr.Textbox(label="AI 回答", lines=8)
-        question_btn.click(ask_question, inputs=question_input, outputs=answer_output)
-        question_input.submit(ask_question, inputs=question_input, outputs=answer_output)
-    clear_btn = gr.Button("清除所有資料")
-    clear_btn.click(clear_all, outputs=[summary_output, question_input, answer_output])
 if __name__ == "__main__":
-    demo.launch(show_error=True)

 import openai
 import gradio as gr
+import fitz  # PyMuPDF
 from openai import OpenAI
 import traceback
 pdf_text = ""
 def set_api_key(user_api_key):
+    """設定 OpenAI API Key 並初始化客戶端"""
     global api_key, client
     try:
         api_key = user_api_key.strip()
         if not api_key:
             return "❌ API Key 不能為空"
+        if not api_key.startswith('sk-'):
+            return "❌ API Key 格式錯誤，應該以 'sk-' 開頭"
         client = OpenAI(api_key=api_key)
+        # 測試 API Key 是否有效
+        try:
+            test_response = client.chat.completions.create(
+                model="gpt-3.5-turbo",
+                messages=[{"role": "user", "content": "Hello"}],
+                max_tokens=5
+            )
+            return "✅ API Key 已設定並驗證成功！可以開始使用了。"
+        except Exception as e:
+            if "incorrect_api_key" in str(e).lower():
+                return "❌ API Key 無效，請檢查是否正確"
+            elif "quota" in str(e).lower():
+                return "⚠️ API Key 有效，但配額不足"
+            else:
+                return f"⚠️ API Key 設定成功，但測試時出現問題：{str(e)[:100]}"
     except Exception as e:
+        return f"❌ 設定失敗：{str(e)}"
 def set_model(model_name):
+    """設定選擇的模型"""
     global selected_model
+    if model_name:
+        selected_model = model_name
+        return f"✅ 模型已更新為：{model_name}"
+    else:
+        return "❌ 請選擇一個模型"
 def extract_pdf_text(file_path):
+    """從 PDF 文件中提取文字"""
     try:
         doc = fitz.open(file_path)
         text = ""
         for page_num, page in enumerate(doc):
             page_text = page.get_text()
             if page_text.strip():
+                text += f"\n--- 第 {page_num + 1} 頁 ---\n"
+                text += page_text
         doc.close()
         return text
     except Exception as e:
         return f"❌ PDF 解析錯誤: {str(e)}"
 def generate_summary(pdf_file):
+    """從 PDF 內容生成摘要"""
     global summary_text, pdf_text
     if not client:
+        return "❌ 請先設定 OpenAI API Key"
     if not pdf_file:
         return "❌ 請先上傳 PDF 文件"
     try:
         pdf_text = extract_pdf_text(pdf_file.name)
         if not pdf_text.strip():
+            return "⚠️ 無法解析 PDF 文字，可能為純圖片 PDF 或空白文件。"
+        max_chars = 8000
+        if len(pdf_text) > max_chars:
+            pdf_text_truncated = pdf_text[:max_chars] + "\n\n[文本已截斷，僅顯示前 8000 字符]"
+        else:
+            pdf_text_truncated = pdf_text
         response = client.chat.completions.create(
             model=selected_model,
             messages=[
+                {
+                    "role": "system",
+                    "content": """你是一個專業的文檔摘要助手。請將以下 PDF 內容整理為結構化的摘要：
+1. 首先提供一個簡短的總體概述
+2. 然後按照重要性列出主要重點（使用項目符號）
+3. 如果有數據或統計信息，請特別標注
+4. 如果有結論或建議，請單獨列出
+請用繁體中文回答，保持專業且易於理解的語調。"""
+                },
                 {"role": "user", "content": pdf_text_truncated}
             ],
             temperature=0.3
         )
         summary_text = response.choices[0].message.content
         return summary_text
     except Exception as e:
+        error_msg = f"❌ 摘要生成失敗: {str(e)}"
+        print(f"錯誤詳情: {traceback.format_exc()}")
+        return error_msg
 def ask_question(user_question):
+    """基於 PDF 內容回答問題"""
     if not client:
+        return "❌ 請先設定 OpenAI API Key"
     if not summary_text and not pdf_text:
         return "❌ 請先生成 PDF 摘要"
     if not user_question.strip():
         return "❌ 請輸入問題"
     try:
         context = f"PDF 摘要:\n{summary_text}\n\n原始���容（部分）:\n{pdf_text[:2000]}"
         response = client.chat.completions.create(
             model=selected_model,
             messages=[
+                {
+                    "role": "system",
+                    "content": f"""你是一個專業的文檔問答助手。請基於提供的 PDF 內容回答用戶問題。
+規則：
+1. 只根據提供的文檔內容回答
+2. 如果文檔中沒有相關信息，請明確說明
+3. 引用具體的文檔內容來支持你的回答
+4. 用繁體中文回答
+5. 保持客觀和準確
+文檔內容：
+{context}"""
+                },
                 {"role": "user", "content": user_question}
             ],
             temperature=0.2
         )
         return response.choices[0].message.content
     except Exception as e:
+        error_msg = f"❌ 問答生成失敗: {str(e)}"
+        print(f"錯誤詳情: {traceback.format_exc()}")
+        return error_msg
 def clear_all():
+    """清除所有資料"""
     global summary_text, pdf_text
     summary_text = ""
     pdf_text = ""
     return "", "", ""
+# 創建最簡單的 Gradio 介面
+with gr.Blocks(
+    title="PDF 摘要助手",
+    css="""
+    /* 隱藏 Gradio logo 和 footer */
+    footer { display: none !important; }
+    .gradio-container footer { display: none !important; }
+    div[class*="footer"] { display: none !important; }
+    div[class*="Footer"] { display: none !important; }
+    .gr-footer { display: none !important; }
+    /* 強制修復按鈕 */
+    button {
+        pointer-events: auto !important;
+        z-index: 9999 !important;
+        position: relative !important;
+        cursor: pointer !important;
+    }
+    """
+) as demo:
+    gr.Markdown("# 📄 PDF 摘要 & 問答助手")
     with gr.Tab("🔧 設定"):
+        gr.Markdown("## API Key 設定")
+        api_key_input = gr.Textbox(
+            label="輸入 OpenAI API Key",
+            type="password",
+            placeholder="請輸入您的 OpenAI API Key (sk-...)"
+        )
+        with gr.Row():
+            api_key_btn = gr.Button("確認設定 API Key", variant="primary")
+        api_key_status = gr.Textbox(
+            label="API 狀態",
+            interactive=False,
+            value="等待設定 API Key..."
+        )
+        gr.Markdown("## 模型選擇")
+        model_choice = gr.Radio(
+            choices=["gpt-4", "gpt-4.1", "gpt-4.5"],
+            label="選擇 AI 模型",
+            value="gpt-4"
+        )
+        with gr.Row():
+            model_btn = gr.Button("確認選擇模型", variant="secondary")
+        model_status = gr.Textbox(
+            label="當前模型",
+            interactive=False,
+            value="已選擇：gpt-4"
+        )
+    with gr.Tab("📄 PDF 處理"):
+        gr.Markdown("## 上傳 PDF 文件")
+        pdf_upload = gr.File(
+            label="選擇 PDF 文件",
+            file_types=[".pdf"]
+        )
+        with gr.Row():
+            summary_btn = gr.Button("生成摘要", variant="primary")
+            clear_btn = gr.Button("清除資料", variant="secondary")
+        summary_output = gr.Textbox(
+            label="PDF 摘要",
+            lines=15,
+            placeholder="上傳 PDF 文件並點擊「生成摘要」按鈕"
+        )
     with gr.Tab("❓ 問答"):
+        gr.Markdown("## AI 問答")
+        question_input = gr.Textbox(
+            label="請輸入您的問題",
+            placeholder="例如：這份文件的主要結論是什麼？",
+            lines=3
+        )
+        with gr.Row():
+            question_btn = gr.Button("發送問題", variant="primary")
+        answer_output = gr.Textbox(
+            label="AI 回答",
+            lines=10,
+            placeholder="AI 回答將顯示在這裡"
+        )
+    # 事件綁定 - 使用最明確的方式
+    def handle_api_key():
+        return set_api_key(api_key_input.value if hasattr(api_key_input, 'value') else "")
+    def handle_model():
+        return set_model(model_choice.value if hasattr(model_choice, 'value') else "gpt-4")
+    def handle_summary():
+        return generate_summary(pdf_upload.value if hasattr(pdf_upload, 'value') else None)
+    def handle_question():
+        return ask_question(question_input.value if hasattr(question_input, 'value') else "")
+    # 綁定點擊事件
+    api_key_btn.click(set_api_key, inputs=[api_key_input], outputs=[api_key_status])
+    model_btn.click(set_model, inputs=[model_choice], outputs=[model_status])
+    summary_btn.click(generate_summary, inputs=[pdf_upload], outputs=[summary_output])
+    question_btn.click(ask_question, inputs=[question_input], outputs=[answer_output])
+    clear_btn.click(clear_all, inputs=[], outputs=[summary_output, question_input, answer_output])
+    # Enter 鍵支援
+    api_key_input.submit(set_api_key, inputs=[api_key_input], outputs=[api_key_status])
+    question_input.submit(ask_question, inputs=[question_input], outputs=[answer_output])
 if __name__ == "__main__":
+    demo.launch(
+        share=False,
+        show_api=False,
+        show_error=True,
+        favicon_path=None
+    )