Spaces:

3a05chatgpt
/

pdf-summarizer-app

Sleeping

App Files Files Community

3a05chatgpt commited on 4 days ago

Commit

6ae9e47

verified ·

1 Parent(s): 471dcf3

Update app.py

Browse files

Files changed (1) hide show

app.py +56 -324

app.py CHANGED Viewed

@@ -1,6 +1,6 @@
 import openai
 import gradio as gr
-import fitz
 from openai import OpenAI
 import traceback
@@ -19,15 +19,16 @@ def set_api_key(user_api_key):
         if not api_key:
             return "❌ API Key 不能為空"
-        if not api_key.startswith('sk-'):
-            return "❌ API Key 格式錯誤，應該以 'sk-' 開頭"
         client = OpenAI(api_key=api_key)
         # 測試 API Key 是否有效
         test_response = client.chat.completions.create(
-            model="gpt-3.5-turbo",  # 使用較便宜的模型測試
-            messages=[{"role": "user", "content": "測試"}],
             max_tokens=5
         )
         return "✅ API Key 已設定並驗證成功！"
@@ -40,13 +41,11 @@ def set_api_key(user_api_key):
             return f"❌ API Key 設定失敗: {str(e)}"
 def set_model(model_name):
-    """設定選擇的模型"""
     global selected_model
     selected_model = model_name
     return f"✅ 模型已選擇：{model_name}"
 def extract_pdf_text(file_path):
-    """從 PDF 文件中提取文字"""
     try:
         doc = fitz.open(file_path)
         text = ""
@@ -60,371 +59,104 @@ def extract_pdf_text(file_path):
         return f"❌ PDF 解析錯誤: {str(e)}"
 def generate_summary(pdf_file):
-    """從 PDF 內容生成摘要"""
     global summary_text, pdf_text
     if not client:
         return "❌ 請先設定 OpenAI API Key"
     if not pdf_file:
         return "❌ 請先上傳 PDF 文件"
     try:
-        # 從 PDF 提取文字
         pdf_text = extract_pdf_text(pdf_file.name)
         if not pdf_text.strip():
             return "⚠️ 無法解析 PDF 文字，可能為純圖片 PDF 或空白文件。"
-        # 截斷過長的文字
-        max_chars = 8000
-        if len(pdf_text) > max_chars:
-            pdf_text_truncated = pdf_text[:max_chars] + "\n\n[文本已截斷，僅顯示前 8000 字符]"
-        else:
-            pdf_text_truncated = pdf_text
-        # 生成摘要
         response = client.chat.completions.create(
             model=selected_model,
             messages=[
-                {
-                    "role": "system",
-                    "content": """你是一個專業的文檔摘要助手。請將以下 PDF 內容整理為結構化的摘要：
-1. 首先提供一個簡短的總體概述
-2. 然後按照重要性列出主要重點（使用項目符號）
-3. 如果有數據或統計信息，請特別標注
-4. 如果有結論或建議，請單獨列出
-請用繁體中文回答，保持專業且易於理解的語調。"""
-                },
                 {"role": "user", "content": pdf_text_truncated}
             ],
             temperature=0.3
         )
         summary_text = response.choices[0].message.content
         return summary_text
     except Exception as e:
-        print(f"錯誤詳情: {traceback.format_exc()}")
         return f"❌ 摘要生成失敗: {str(e)}"
 def ask_question(user_question):
-    """基於 PDF 內容回答問題"""
     if not client:
         return "❌ 請先設定 OpenAI API Key"
     if not summary_text and not pdf_text:
         return "❌ 請先生成 PDF 摘要"
     if not user_question.strip():
         return "❌ 請輸入問題"
     try:
-        # 組合上下文
         context = f"PDF 摘要:\n{summary_text}\n\n原始內容（部分）:\n{pdf_text[:2000]}"
         response = client.chat.completions.create(
             model=selected_model,
             messages=[
-                {
-                    "role": "system",
-                    "content": f"""你是一個專業的文檔問答助手。請基於提供的 PDF 內容回答用戶問題。
-規則：
-1. 只根據提供的文檔內容回答
-2. 如果文檔中沒有相關信息，請明確說明
-3. 引用具體的文檔內容來支持你的回答
-4. 用繁體中文回答
-5. 保持客觀和準確
-文檔內容：
-{context}"""
-                },
                 {"role": "user", "content": user_question}
             ],
             temperature=0.2
         )
         return response.choices[0].message.content
     except Exception as e:
-        print(f"錯誤詳情: {traceback.format_exc()}")
         return f"❌ 問答生成失敗: {str(e)}"
 def clear_all():
-    """清除所有資料"""
     global summary_text, pdf_text
     summary_text = ""
     pdf_text = ""
     return "", "", ""
-# 自定義 CSS 樣式 - 藍紫色主題
-custom_css = """
-/* 主要容器背景 */
-.gradio-container {
-    background: linear-gradient(135deg, #667eea 0%, #764ba2 100%) !important;
-    min-height: 100vh;
-}
-/* 隱藏 Gradio footer 和 logo */
-footer { display: none !important; }
-.gradio-container footer { display: none !important; }
-div[class*="footer"] { display: none !important; }
-div[class*="Footer"] { display: none !important; }
-.gr-footer { display: none !important; }
-/* 標籤頁樣式 */
-.tab-nav {
-    background: rgba(255, 255, 255, 0.1) !important;
-    border-radius: 15px !important;
-    backdrop-filter: blur(10px) !important;
-    margin-bottom: 20px !important;
-}
-.tab-nav button {
-    background: rgba(255, 255, 255, 0.1) !important;
-    color: white !important;
-    border: none !important;
-    border-radius: 10px !important;
-    margin: 5px !important;
-    font-weight: 600 !important;
-    transition: all 0.3s ease !important;
-}
-.tab-nav button:hover {
-    background: rgba(255, 255, 255, 0.2) !important;
-    transform: translateY(-2px) !important;
-}
-.tab-nav button.selected {
-    background: rgba(255, 255, 255, 0.3) !important;
-    box-shadow: 0 4px 15px rgba(0, 0, 0, 0.2) !important;
-}
-/* 卡片樣式 */
-.block {
-    background: rgba(255, 255, 255, 0.95) !important;
-    border-radius: 20px !important;
-    box-shadow: 0 8px 32px rgba(0, 0, 0, 0.1) !important;
-    backdrop-filter: blur(10px) !important;
-    border: 1px solid rgba(255, 255, 255, 0.2) !important;
-    margin: 10px 0 !important;
-    padding: 20px !important;
-}
-/* 按鈕樣式 */
-.btn {
-    background: linear-gradient(45deg, #667eea, #764ba2) !important;
-    color: white !important;
-    border: none !important;
-    border-radius: 15px !important;
-    padding: 12px 24px !important;
-    font-weight: 600 !important;
-    transition: all 0.3s ease !important;
-    box-shadow: 0 4px 15px rgba(102, 126, 234, 0.4) !important;
-}
-.btn:hover {
-    transform: translateY(-3px) !important;
-    box-shadow: 0 6px 20px rgba(102, 126, 234, 0.6) !important;
-}
-.btn-secondary {
-    background: linear-gradient(45deg, #a8a8a8, #6c757d) !important;
-    box-shadow: 0 4px 15px rgba(168, 168, 168, 0.4) !important;
-}
-.btn-secondary:hover {
-    box-shadow: 0 6px 20px rgba(168, 168, 168, 0.6) !important;
-}
-/* 輸入框樣式 */
-.gr-textbox, .gr-file, .gr-radio {
-    border-radius: 15px !important;
-    border: 2px solid rgba(102, 126, 234, 0.3) !important;
-    background: rgba(255, 255, 255, 0.9) !important;
-    transition: all 0.3s ease !important;
-}
-.gr-textbox:focus, .gr-file:focus {
-    border-color: #667eea !important;
-    box-shadow: 0 0 20px rgba(102, 126, 234, 0.3) !important;
-}
-/* 標題樣式 */
-h1, h2, h3 {
-    color: white !important;
-    text-shadow: 2px 2px 4px rgba(0, 0, 0, 0.3) !important;
-    font-weight: 700 !important;
-}
-/* Markdown 內容樣式 */
-.markdown {
-    background: rgba(255, 255, 255, 0.95) !important;
-    border-radius: 15px !important;
-    padding: 20px !important;
-    margin: 10px 0 !important;
-    box-shadow: 0 4px 15px rgba(0, 0, 0, 0.1) !important;
-}
-/* 進度條樣式 */
-.progress {
-    background: linear-gradient(45deg, #667eea, #764ba2) !important;
-    border-radius: 10px !important;
-}
-/* 滾動條樣式 */
-::-webkit-scrollbar {
-    width: 8px;
-}
-::-webkit-scrollbar-track {
-    background: rgba(255, 255, 255, 0.1);
-    border-radius: 10px;
-}
-::-webkit-scrollbar-thumb {
-    background: linear-gradient(45deg, #667eea, #764ba2);
-    border-radius: 10px;
-}
-::-webkit-scrollbar-thumb:hover {
-    background: linear-gradient(45deg, #5a6fd8, #6a4190);
-}
-/* 動畫效果 */
-@keyframes fadeIn {
-    from { opacity: 0; transform: translateY(20px); }
-    to { opacity: 1; transform: translateY(0); }
-}
-.block {
-    animation: fadeIn 0.6s ease-out !important;
-}
-"""
-# 創建 Gradio 介面
 with gr.Blocks(
     title="PDF 摘要助手",
-    css=custom_css,
-    theme=gr.themes.Soft(
-        primary_hue="blue",
-        secondary_hue="purple",
-        neutral_hue="slate",
-    )
 ) as demo:
-    gr.Markdown("""
-    # 📄 PDF 摘要 & 問答助手
-    🚀 **歡迎使用 PDF 智能分析工具！**
-    **主要功能：**
-    - 📋 自動生成 PDF 文檔摘要
-    - 🤖 基於文檔內容回答問題
-    - 💡 快速理解長篇文檔的核心��容
-    **使用步驟：**
-    1. 先在「設定」頁面輸入您的 OpenAI API Key
-    2. 選擇適合的 AI 模型
-    3. 在「摘要」頁面上傳 PDF 文件並生成摘要
-    4. 在「問答」頁面提出關於文件的問題
-    ---
-    """)
-    with gr.Tab("🔧 設定"):
-        gr.Markdown("### API Key 設定")
-        api_key_input = gr.Textbox(
-            label="🔑 輸入 OpenAI API Key",
-            type="password",
-            placeholder="請輸入您的 OpenAI API Key (sk-...)",
-            elem_classes=["gr-textbox"]
-        )
-        api_key_btn = gr.Button("確認 API Key", variant="primary", elem_classes=["btn"])
-        api_key_status = gr.Textbox(
-            label="📊 API 狀態",
-            interactive=False,
-            value="🔄 等待設定 API Key...",
-            elem_classes=["gr-textbox"]
-        )
-        gr.Markdown("### 模型選擇")
-        model_choice = gr.Radio(
-            ["gpt-4", "gpt-4.1", "gpt-4.5"],
-            label="🤖 選擇 AI 模型",
-            value="gpt-4",
-            elem_classes=["gr-radio"]
-        )
-        model_status = gr.Textbox(
-            label="🎯 模型狀態",
-            interactive=False,
-            value="✅ 已選擇：gpt-4",
-            elem_classes=["gr-textbox"]
-        )
-    with gr.Tab("📄 PDF 摘要"):
-        gr.Markdown("### 文件上傳與摘要生成")
-        pdf_upload = gr.File(
-            label="📁 上傳 PDF 文件",
-            file_types=[".pdf"],
-            elem_classes=["gr-file"]
-        )
-        with gr.Row():
-            summary_btn = gr.Button("🔄 生成摘要", variant="primary", elem_classes=["btn"])
-            clear_btn = gr.Button("🗑️ 清除資料", variant="secondary", elem_classes=["btn", "btn-secondary"])
-        summary_output = gr.Textbox(
-            label="📋 PDF 摘要",
-            lines=15,
-            placeholder="上傳 PDF 文件並點擊「生成摘要」按鈕，AI 將為您分析文檔內容...",
-            elem_classes=["gr-textbox"]
-        )
-    with gr.Tab("❓ 智能問答"):
-        gr.Markdown("### 基於文檔內容的問答")
-        question_input = gr.Textbox(
-            label="💭 請輸入您的問題",
-            lines=3,
-            placeholder="例如：這份文件的主要結論是什麼？文中提到的關鍵數據有哪些？",
-            elem_classes=["gr-textbox"]
-        )
-        question_btn = gr.Button("📤 送出問題", variant="primary", elem_classes=["btn"])
-        answer_output = gr.Textbox(
-            label="🤖 AI 回答",
-            lines=12,
-            placeholder="請先上傳並生成 PDF 摘要，然後輸入問題，AI 將基於文檔內容為您提供回答...",
-            elem_classes=["gr-textbox"]
-        )
-        gr.Markdown("""
-        **💡 問題範例：**
-        - 這份文件討論的主要議題是什麼？
-        - 文中有哪些重要的統計數據？
-        - 作者的主要觀點和結論是什麼？
-        - 文件中提到的建議有哪些？
-        """)
-    # 事件綁定
-    api_key_btn.click(set_api_key, inputs=api_key_input, outputs=api_key_status)
-    api_key_input.submit(set_api_key, inputs=api_key_input, outputs=api_key_status)
-    model_choice.change(set_model, inputs=model_choice, outputs=model_status)
-    summary_btn.click(generate_summary, inputs=pdf_upload, outputs=summary_output)
-    question_btn.click(ask_question, inputs=question_input, outputs=answer_output)
-    question_input.submit(ask_question, inputs=question_input, outputs=answer_output)
-    clear_btn.click(clear_all, outputs=[summary_output, question_input, answer_output])
 if __name__ == "__main__":
-    demo.launch(
-        show_error=True,
-        share=True,
-        server_name="0.0.0.0",
-        server_port=7860
-    )

 import openai
 import gradio as gr
+import fitz  # PyMuPDF
 from openai import OpenAI
 import traceback
         if not api_key:
             return "❌ API Key 不能為空"
+        # 支援新舊 key 格式
+        if not (api_key.startswith('sk-') or api_key.startswith('sk-proj-')):
+            return "❌ API Key 格式錯誤，必須以 'sk-' 或 'sk-proj-' 開頭"
         client = OpenAI(api_key=api_key)
         # 測試 API Key 是否有效
         test_response = client.chat.completions.create(
+            model="gpt-4",
+            messages=[{"role": "user", "content": "你好"}],
             max_tokens=5
         )
         return "✅ API Key 已設定並驗證成功！"
             return f"❌ API Key 設定失敗: {str(e)}"
 def set_model(model_name):
     global selected_model
     selected_model = model_name
     return f"✅ 模型已選擇：{model_name}"
 def extract_pdf_text(file_path):
     try:
         doc = fitz.open(file_path)
         text = ""
         return f"❌ PDF 解析錯誤: {str(e)}"
 def generate_summary(pdf_file):
     global summary_text, pdf_text
     if not client:
         return "❌ 請先設定 OpenAI API Key"
     if not pdf_file:
         return "❌ 請先上傳 PDF 文件"
     try:
         pdf_text = extract_pdf_text(pdf_file.name)
         if not pdf_text.strip():
             return "⚠️ 無法解析 PDF 文字，可能為純圖片 PDF 或空白文件。"
+        pdf_text_truncated = pdf_text[:8000]
         response = client.chat.completions.create(
             model=selected_model,
             messages=[
+                {"role": "system", "content": "請將以下 PDF 內容整理為條列式摘要，用繁體中文回答："},
                 {"role": "user", "content": pdf_text_truncated}
             ],
             temperature=0.3
         )
         summary_text = response.choices[0].message.content
         return summary_text
     except Exception as e:
+        print(traceback.format_exc())
         return f"❌ 摘要生成失敗: {str(e)}"
 def ask_question(user_question):
     if not client:
         return "❌ 請先設定 OpenAI API Key"
     if not summary_text and not pdf_text:
         return "❌ 請先生成 PDF 摘要"
     if not user_question.strip():
         return "❌ 請輸入問題"
     try:
         context = f"PDF 摘要:\n{summary_text}\n\n原始內容（部分）:\n{pdf_text[:2000]}"
         response = client.chat.completions.create(
             model=selected_model,
             messages=[
+                {"role": "system", "content": f"根據以下 PDF 內容回答問題，請用繁體中文回答：\n{context}"},
                 {"role": "user", "content": user_question}
             ],
             temperature=0.2
         )
         return response.choices[0].message.content
     except Exception as e:
+        print(traceback.format_exc())
         return f"❌ 問答生成失敗: {str(e)}"
 def clear_all():
     global summary_text, pdf_text
     summary_text = ""
     pdf_text = ""
     return "", "", ""
 with gr.Blocks(
     title="PDF 摘要助手",
+    css="""
+    .gradio-container {
+        max-width: none !important;
+        width: 100% !important;
+        background: linear-gradient(135deg, #667eea 0%, #764ba2 100%) !important;
+        min-height: 100vh;
+    }
+    .main-content {
+        max-width: 1600px !important;
+        margin: 20px auto !important;
+        padding: 30px !important;
+        background: rgba(255, 255, 255, 0.95) !important;
+        border-radius: 20px !important;
+    }
+    """
 ) as demo:
+    with gr.Column():
+        gr.Markdown("## 📄 PDF 摘要 & 問答助手")
+        with gr.Tab("🔧 設定"):
+            api_key_input = gr.Textbox(label="🔑 輸入 OpenAI API Key", type="password")
+            api_key_status = gr.Textbox(label="API 狀態", interactive=False, value="等待設定 API Key...")
+            api_key_btn = gr.Button("確認 API Key")
+            api_key_btn.click(set_api_key, inputs=api_key_input, outputs=api_key_status)
+            model_choice = gr.Radio(["gpt-4", "gpt-4.1", "gpt-4.5"], label="選擇 AI 模型", value="gpt-4")
+            model_status = gr.Textbox(label="模型狀態", interactive=False, value="✅ 已選擇：gpt-4")
+            model_choice.change(set_model, inputs=model_choice, outputs=model_status)
+        with gr.Tab("📄 摘要"):
+            pdf_upload = gr.File(label="上傳 PDF", file_types=[".pdf"])
+            summary_btn = gr.Button("生成摘要")
+            summary_output = gr.Textbox(label="PDF 摘要", lines=12)
+            summary_btn.click(generate_summary, inputs=pdf_upload, outputs=summary_output)
+        with gr.Tab("❓ 問答"):
+            question_input = gr.Textbox(label="請輸入問題", lines=2)
+            question_btn = gr.Button("送出問題")
+            answer_output = gr.Textbox(label="AI 回答", lines=8)
+            question_btn.click(ask_question, inputs=question_input, outputs=answer_output)
+            question_input.submit(ask_question, inputs=question_input, outputs=answer_output)
+        clear_btn = gr.Button("🗑️ 清除所有資料")
+        clear_btn.click(clear_all, outputs=[summary_output, question_input, answer_output])
 if __name__ == "__main__":
+    demo.launch(show_error=True)