File size: 447 Bytes
cd3e0b8
 
93c008b
cd3e0b8
 
 
 
 
 
f1e5728
cd3e0b8
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
# pdfsum.py
from PyPDF2 import PdfReader

def 提取_pdf文本(pdf_file):
    """Return the text of every page in *pdf_file*, joined by newlines.

    The input is handed to ``PdfReader`` unchanged. A page whose
    ``extract_text()`` result is falsy (``None`` or an empty string)
    contributes an empty string, so the output keeps one
    newline-separated segment per page.
    """
    page_texts = [pg.extract_text() or "" for pg in PdfReader(pdf_file).pages]
    return "\n".join(page_texts)

def 提取_pdf摘要(pdf_file, summarizer_func):
    """Summarize the text extracted from *pdf_file*.

    The text is obtained via ``提取_pdf文本``. When it holds at least 30
    characters after stripping surrounding whitespace, the full
    (unstripped) text is passed to *summarizer_func* and that call's
    result is returned. Otherwise a fixed error-message string is
    returned and *summarizer_func* is never called.
    """
    extracted = 提取_pdf文本(pdf_file)
    # Whitespace-only or near-empty extractions are not worth summarizing.
    has_enough_text = len(extracted.strip()) >= 30
    if has_enough_text:
        return summarizer_func(extracted)
    return "❌ 無法提取足夠文字內容"