PDF-resizer

Sleeping

App Files Files Community

soiz1 commited on Jul 11

Commit

99ee49c

verified ·

1 Parent(s): 308d902

Update app.py

Browse files

Files changed (1) hide show

app.py +39 -124

app.py CHANGED Viewed

@@ -1,135 +1,50 @@
 import gradio as gr
-import tempfile
 from pdf2image import convert_from_path
-import fitz  # PyMuPDF
-import cv2
-import numpy as np
-# ========== 解析ロジック関数 ==========
-def estimate_blurriness(pil_image):
-    """
-    ぼけ度を推定（Laplacian分散）
-    値が小さいほどぼけている
-    """
-    gray = np.array(pil_image.convert('L'))
-    return cv2.Laplacian(gray, cv2.CV_64F).var()
-def estimate_contrast(pil_image):
-    """
-    コントラストを推定（標準偏差）
-    値が小さいほどグレーでのっぺり
-    """
-    gray = np.array(pil_image.convert('L'))
-    return gray.std()
-def analyze_pdf(pdf_file):
-    """
-    アップロードされたPDFの各ページを画像に変換し
-    - 画像サイズ
-    - 総ピクセル数
-    - ぼけ度
-    - コントラスト
-    - 推定DPI
-    などをもとにAudiverisでの利用適性を判定
-    """
-    MAX_PIXELS_AUDIVERIS = 20_000_000
-    results = []
-    overall_rating = "OK"
-    try:
-        with tempfile.TemporaryDirectory() as tmpdir:
-            # PDF → 画像変換
-            images = convert_from_path(pdf_file.name, dpi=300, output_folder=tmpdir)
-            doc = fitz.open(pdf_file.name)
-            dpi_infos = []
-            for i, (img, page) in enumerate(zip(images, doc)):
-                width, height = img.size
-                total_pixels = width * height
-                reasons = []
-                page_rating = "OK"
-                # Audiverisのピクセル上限チェック
-                if total_pixels > MAX_PIXELS_AUDIVERIS:
-                    page_rating = "非推奨（画像が大きすぎる）"
-                    reasons.append(f"総ピクセル数 {total_pixels:,} > 20,000,000")
-                # 解像度チェック
-                if width < 1000 or height < 1000 and "非推奨" not in page_rating:
-                    page_rating = "非推奨（解像度が小さい）"
-                    reasons.append("幅または高さが1000px未満")
-                elif width < 1500 or height < 1500 and page_rating == "OK":
-                    page_rating = "注意（やや低め）"
-                # ぼけ度チェック
-                blur_score = estimate_blurriness(img)
-                if blur_score < 30 and "非推奨" not in page_rating:
-                    page_rating = "非推奨（ぼけている）"
-                    reasons.append(f"ぼけ度={blur_score:.1f}")
-                # コントラストチェック
-                contrast_score = estimate_contrast(img)
-                if contrast_score < 30 and "非推奨" not in page_rating:
-                    page_rating = "非推奨（コントラストが低い）"
-                    reasons.append(f"コントラスト={contrast_score:.1f}")
-                # DPI情報
-                rect = page.rect
-                width_pt = rect.width
-                height_pt = rect.height
-                dpi_x = width / (width_pt / 72)
-                dpi_y = height / (height_pt / 72)
-                dpi_infos.append(f"ページ{i+1}推定DPI: {dpi_x:.1f}x{dpi_y:.1f}")
-                # 理由をまとめる
-                reasons_str = "; ".join(reasons) if reasons else "条件クリア"
-                # ページ結果
-                results.append(
-                    f"ページ{i+1}: {width}x{height}px / ピクセル数={total_pixels:,} / "
-                    f"ぼけ度={blur_score:.1f} / コントラスト={contrast_score:.1f} → {page_rating} ({reasons_str})"
-                )
-                # 総合評価を更新
-                if "非推奨" in page_rating:
-                    overall_rating = "非推奨"
-                elif "注意" in page_rating and overall_rating == "OK":
-                    overall_rating = "注意"
-            # まとめテキスト
-            result_text = "\n".join(results + [""] + dpi_infos)
-            result_text += f"\n\n総合評価: {overall_rating}"
-            # 改善提案
-            if overall_rating == "非推奨":
-                result_text += "\n\n推奨対策: スキャン解像度を下げる・画像を縮小するなどして、ファイルサイズや画質を調整してください。"
-            return result_text, overall_rating
-    except Exception as e:
-        return f"処理中にエラーが発生しました: {str(e)}", "エラー"
-# ========== Gradio UI部分 ==========
 with gr.Blocks() as demo:
-    gr.Markdown("# 🎼 Audiveris適性チェック（非公式・推定）")
     gr.Markdown(
-        """
-        PDFをアップロードすると、ページごとの画像サイズ、ピクセル数、ぼけ度、コントラストを分析し、
-        Audiverisで使用可能かを「OK / 注意 / 非推奨」で推定します。
-        """
     )
     with gr.Row():
-        pdf_input = gr.File(label="PDFファイル")
-        analyze_button = gr.Button("判定")
-    result_output = gr.Textbox(label="詳細結果", lines=20)
-    rating_output = gr.Textbox(label="総合評価")
-    analyze_button.click(analyze_pdf, inputs=pdf_input, outputs=[result_output, rating_output])
-if __name__ == "__main__":
-    demo.launch()

 import gradio as gr
 from pdf2image import convert_from_path
+from PIL import Image
+import img2pdf
+import tempfile
+import os
+def downscale_pdf(pdf_file, max_width=3000, dpi=150):
+    with tempfile.TemporaryDirectory() as tmpdir:
+        # ステップ 1: PDF → 画像
+        images = convert_from_path(pdf_file.name, dpi=300, fmt='jpeg', output_folder=tmpdir)
+        downscaled_images = []
+        for i, img in enumerate(images):
+            w, h = img.size
+            total_px = w * h
+            print(f"Original Page {i+1}: {w}x{h} = {total_px}")
+            # サイズ制限
+            if w > max_width:
+                ratio = max_width / w
+                new_w = int(w * ratio)
+                new_h = int(h * ratio)
+                img = img.resize((new_w, new_h), Image.LANCZOS)
+                print(f"Downscaled Page {i+1}: {new_w}x{new_h} = {new_w * new_h}")
+            tmp_image_path = os.path.join(tmpdir, f"page_{i+1}.jpg")
+            img.save(tmp_image_path, "JPEG", quality=95)
+            downscaled_images.append(tmp_image_path)
+        # ステップ 2: 画像 → PDF
+        output_pdf_path = os.path.join(tmpdir, "downscaled.pdf")
+        with open(output_pdf_path, "wb") as f:
+            f.write(img2pdf.convert(downscaled_images))
+        return output_pdf_path
 with gr.Blocks() as demo:
+    gr.Markdown("## PDFダウンサイザー for Audiveris")
     gr.Markdown(
+        "PDFをアップロードすると、ページ画像を縮小してAudiveris向けに最適化したPDFを生成します。"
     )
     with gr.Row():
+        pdf_input = gr.File(label="PDFファイルをアップロード")
+        pdf_output = gr.File(label="変換後PDF")
+    convert_button = gr.Button("変換してダウンロード")
+    convert_button.click(fn=downscale_pdf, inputs=pdf_input, outputs=pdf_output)
+demo.launch()