Book-Maker-CVLM-AI-UI-UX

Sleeping

App Files Community

awacke1 committed 10 days ago

Commit

1f34dc9

verified ·

1 Parent(s): f258b94

Update app.py

Browse files

Files changed (1) hide show

app.py +28 -56

app.py CHANGED Viewed

@@ -27,8 +27,8 @@ LAYOUTS = {
 OUTPUT_DIR = Path("generated_pdfs")
 OUTPUT_DIR.mkdir(exist_ok=True)
-# Path for the required emoji font file
-EMOJI_FONT_PATH = Path("NotoColorEmoji-Regular.ttf")
 # Regex to find and wrap emojis for ReportLab
 EMOJI_PATTERN = re.compile(
@@ -52,7 +52,6 @@ EMOJI_PATTERN = re.compile(
 class PDFGenerator:
     """
-    An object-oriented approach to generating PDFs.
     Handles font registration, markdown parsing, and PDF creation.
     """
     def __init__(self, font_path: Path):
@@ -69,9 +68,8 @@ class PDFGenerator:
         Registers the TTF font file with ReportLab if the file exists.
         """
         if font_path.exists():
-            pdfmetrics.registerFont(TTFont(self.emoji_font_name, font_path))
         else:
-            # Provide a helpful error in the web app if the font is missing
             st.error(f"Emoji font not found at '{font_path}'. Emojis will not be rendered. Please download it.")
             self.emoji_font_name = "Helvetica" # Fallback to a standard font
@@ -80,11 +78,8 @@ class PDFGenerator:
         😀 To make emojis appear so grand, wrap them with a font command.
         Finds all emojis and wraps them in ReportLab <font> tags.
         """
-        # If the emoji font failed to register, don't try to use it.
         if self.emoji_font_name != "NotoEmoji":
             return text
-        # The lambda function takes each matched emoji (m) and wraps it.
         return EMOJI_PATTERN.sub(lambda m: f'<font name="{self.emoji_font_name}">{m.group(0)}</font>', text)
     def _markdown_to_story(self, markdown_text: str) -> list:
@@ -93,13 +88,10 @@ class PDFGenerator:
         Converts a markdown string 📝 into a list of ReportLab Flowables (a 'story').
         """
         styles = getSampleStyleSheet()
-        # Define custom styles for different markdown elements
         style_normal = styles['BodyText']
         style_h1 = styles['h1']
         style_h2 = styles['h2']
         style_h3 = styles['h3']
-        # Use a monospaced font for code blocks
         style_code = ParagraphStyle('Code', parent=styles['Normal'], fontName='Courier', textColor=colors.darkred)
         story = []
@@ -108,7 +100,6 @@ class PDFGenerator:
         code_block_text = ""
         for line in lines:
-            # Handle code blocks (```)
             if line.strip().startswith("```"):
                 if in_code_block:
                     story.append(Paragraph(code_block_text, style_code))
@@ -119,33 +110,35 @@ class PDFGenerator:
                 continue
             if in_code_block:
-                # Escape HTML-sensitive characters and preserve line breaks within code
                 escaped_line = line.replace('&', '&amp;').replace('<', '&lt;').replace('>', '&gt;')
                 code_block_text += escaped_line + '<br/>'
                 continue
-            # This is where we process each line for emojis BEFORE creating a Paragraph
-            processed_line = self._wrap_emojis_for_reportlab(line)
-            # Handle markdown syntax
-            if processed_line.startswith("# "):
-                story.append(Paragraph(self._wrap_emojis_for_reportlab(processed_line[2:]), style_h1))
-            elif processed_line.startswith("## "):
-                story.append(Paragraph(self._wrap_emojis_for_reportlab(processed_line[3:]), style_h2))
-            elif processed_line.startswith("### "):
-                story.append(Paragraph(self._wrap_emojis_for_reportlab(processed_line[4:]), style_h3))
-            elif processed_line.strip().startswith(("* ", "- ")):
-                story.append(Paragraph(f"• {self._wrap_emojis_for_reportlab(processed_line.strip()[2:])}", style_normal))
-            elif re.match(r'^\d+\.\s', processed_line.strip()):
-                story.append(Paragraph(processed_line.strip(), style_normal))
-            elif processed_line.strip() == "":
                 story.append(Spacer(1, 0.2 * inch))
             else:
-                # Handle bold (**) and italics (_) using ReportLab's rich text tags
-                formatted_line = re.sub(r'\*\*(.*?)\*\*', r'<b>\1</b>', processed_line)
                 formatted_line = re.sub(r'_(.*?)_', r'<i>\1</i>', formatted_line)
-                story.append(Paragraph(formatted_line, style_normal))
         return story
     def create_pdf(self, md_asset: Path, layout_name: str, layout_properties: dict):
@@ -155,26 +148,18 @@ class PDFGenerator:
         """
         try:
             md_content = md_asset.read_text(encoding="utf-8")
             date_str = datetime.datetime.now().strftime("%Y-%m-%d")
             output_filename = f"{md_asset.stem}_{layout_name.replace(' ', '-')}_{date_str}.pdf"
             output_path = OUTPUT_DIR / output_filename
-            # The SimpleDocTemplate handles the page creation and content flow
             doc = SimpleDocTemplate(
                 str(output_path),
                 pagesize=layout_properties.get("size", A4),
-                rightMargin=inch,
-                leftMargin=inch,
-                topMargin=inch,
-                bottomMargin=inch
             )
             story = self._markdown_to_story(md_content)
-            # The .build() method takes the story and renders the PDF
             doc.build(story)
         except Exception as e:
             st.error(f"Failed to process {md_asset.name} with ReportLab: {e}")
@@ -184,7 +169,6 @@ class PDFGenerator:
 def get_file_download_link(file_path: Path) -> str:
     """
     🔗 To grab your file and not delay, a special link is paved today.
-    Generates a base64-encoded download link for a file.
     """
     with open(file_path, "rb") as f:
         data = base64.b64encode(f.read()).decode()
@@ -193,10 +177,8 @@ def get_file_download_link(file_path: Path) -> str:
 def display_file_explorer():
     """
     📂 To see your files, both old and new, this handy explorer gives a view.
-    Renders a simple file explorer in the Streamlit app for MD and PDF files.
     """
     st.header("📂 File Explorer")
     st.subheader("Source Markdown Files (.md)")
     md_files = list(Path(".").glob("*.md"))
     if not md_files:
@@ -210,7 +192,6 @@ def display_file_explorer():
                 st.markdown(get_file_download_link(md_file), unsafe_allow_html=True)
     st.subheader("Generated PDF Files")
-    # Sort PDFs by modification time to show the newest first
     pdf_files = sorted(list(OUTPUT_DIR.glob("*.pdf")), key=lambda p: p.stat().st_mtime, reverse=True)
     if not pdf_files:
         st.info("No PDFs generated yet. Click the button above to start.")
@@ -222,7 +203,6 @@ def display_file_explorer():
             with col2:
                 st.markdown(get_file_download_link(pdf_file), unsafe_allow_html=True)
 # --- Main App Execution ---
 def main():
@@ -233,41 +213,33 @@ def main():
     st.title("📄 Markdown to PDF Generator")
     st.markdown("This tool converts all `.md` files in this directory to PDF. It now supports emojis! 👍")
-    # Create a sample markdown file if none exist, to help new users.
-    if not list(Path(".").glob("*.md")):
         with open("sample.md", "w", encoding="utf-8") as f:
             f.write("# Sample Document 👍\n\nThis is a sample markdown file. **ReportLab** is creating the PDF. Emojis like 🚀 and 💡 should now appear correctly.\n\n### Features\n- Item 1\n- Item 2\n\n```\ndef hello_world():\n    print(\"Hello, PDF! 👋\")\n```\n")
         st.rerun()
-    # Instantiate our generator. It will handle font setup on its own.
     pdf_generator = PDFGenerator(EMOJI_FONT_PATH)
     if st.button("🚀 Generate PDFs from all Markdown Files", type="primary"):
         markdown_files = list(Path(".").glob("*.md"))
         if not markdown_files:
             st.warning("No `.md` files found. Please add a markdown file to the directory.")
         else:
             total_pdfs = len(markdown_files) * len(LAYOUTS)
             progress_bar = st.progress(0, text="Starting PDF generation...")
             pdf_count = 0
             with st.spinner("Generating PDFs... Please wait."):
                 for md_file in markdown_files:
                     st.info(f"Processing: **{md_file.name}**")
                     for name, properties in LAYOUTS.items():
-                        # Use the instance method to create the PDF
                         pdf_generator.create_pdf(md_file, name, properties)
                         pdf_count += 1
                         progress_bar.progress(pdf_count / total_pdfs, f"Generated {pdf_count}/{total_pdfs} PDFs...")
             st.success("✅ PDF generation complete!")
             st.balloons()
-            # Rerun to refresh the file explorer immediately
             st.rerun()
     display_file_explorer()
 if __name__ == "__main__":
     main()

 OUTPUT_DIR = Path("generated_pdfs")
 OUTPUT_DIR.mkdir(exist_ok=True)
+# ⚠️ UPDATED: Path for the required NON-COLOR emoji font file.
+EMOJI_FONT_PATH = Path("NotoEmoji-Regular.ttf")
 # Regex to find and wrap emojis for ReportLab
 EMOJI_PATTERN = re.compile(
 class PDFGenerator:
     """
     Handles font registration, markdown parsing, and PDF creation.
     """
     def __init__(self, font_path: Path):
         Registers the TTF font file with ReportLab if the file exists.
         """
         if font_path.exists():
+            pdfmetrics.registerFont(TTFont(self.emoji_font_name, str(font_path)))
         else:
             st.error(f"Emoji font not found at '{font_path}'. Emojis will not be rendered. Please download it.")
             self.emoji_font_name = "Helvetica" # Fallback to a standard font
         😀 To make emojis appear so grand, wrap them with a font command.
         Finds all emojis and wraps them in ReportLab <font> tags.
         """
         if self.emoji_font_name != "NotoEmoji":
             return text
         return EMOJI_PATTERN.sub(lambda m: f'<font name="{self.emoji_font_name}">{m.group(0)}</font>', text)
     def _markdown_to_story(self, markdown_text: str) -> list:
         Converts a markdown string 📝 into a list of ReportLab Flowables (a 'story').
         """
         styles = getSampleStyleSheet()
         style_normal = styles['BodyText']
         style_h1 = styles['h1']
         style_h2 = styles['h2']
         style_h3 = styles['h3']
         style_code = ParagraphStyle('Code', parent=styles['Normal'], fontName='Courier', textColor=colors.darkred)
         story = []
         code_block_text = ""
         for line in lines:
             if line.strip().startswith("```"):
                 if in_code_block:
                     story.append(Paragraph(code_block_text, style_code))
                 continue
             if in_code_block:
                 escaped_line = line.replace('&', '&amp;').replace('<', '&lt;').replace('>', '&gt;')
                 code_block_text += escaped_line + '<br/>'
                 continue
+            # Process the line for markdown syntax first
+            if line.startswith("# "):
+                final_text = self._wrap_emojis_for_reportlab(line[2:])
+                story.append(Paragraph(final_text, style_h1))
+            elif line.startswith("## "):
+                final_text = self._wrap_emojis_for_reportlab(line[3:])
+                story.append(Paragraph(final_text, style_h2))
+            elif line.startswith("### "):
+                final_text = self._wrap_emojis_for_reportlab(line[4:])
+                story.append(Paragraph(final_text, style_h3))
+            elif line.strip().startswith(("* ", "- ")):
+                final_text = self._wrap_emojis_for_reportlab(line.strip()[2:])
+                story.append(Paragraph(f"• {final_text}", style_normal))
+            elif re.match(r'^\d+\.\s', line.strip()):
+                final_text = self._wrap_emojis_for_reportlab(line.strip())
+                story.append(Paragraph(final_text, style_normal))
+            elif line.strip() == "":
                 story.append(Spacer(1, 0.2 * inch))
             else:
+                # Handle bold/italics, then wrap emojis in the final string
+                formatted_line = re.sub(r'\*\*(.*?)\*\*', r'<b>\1</b>', line)
                 formatted_line = re.sub(r'_(.*?)_', r'<i>\1</i>', formatted_line)
+                final_text = self._wrap_emojis_for_reportlab(formatted_line)
+                story.append(Paragraph(final_text, style_normal))
         return story
     def create_pdf(self, md_asset: Path, layout_name: str, layout_properties: dict):
         """
         try:
             md_content = md_asset.read_text(encoding="utf-8")
             date_str = datetime.datetime.now().strftime("%Y-%m-%d")
             output_filename = f"{md_asset.stem}_{layout_name.replace(' ', '-')}_{date_str}.pdf"
             output_path = OUTPUT_DIR / output_filename
             doc = SimpleDocTemplate(
                 str(output_path),
                 pagesize=layout_properties.get("size", A4),
+                rightMargin=inch, leftMargin=inch,
+                topMargin=inch, bottomMargin=inch
             )
             story = self._markdown_to_story(md_content)
             doc.build(story)
         except Exception as e:
             st.error(f"Failed to process {md_asset.name} with ReportLab: {e}")
 def get_file_download_link(file_path: Path) -> str:
     """
     🔗 To grab your file and not delay, a special link is paved today.
     """
     with open(file_path, "rb") as f:
         data = base64.b64encode(f.read()).decode()
 def display_file_explorer():
     """
     📂 To see your files, both old and new, this handy explorer gives a view.
     """
     st.header("📂 File Explorer")
     st.subheader("Source Markdown Files (.md)")
     md_files = list(Path(".").glob("*.md"))
     if not md_files:
                 st.markdown(get_file_download_link(md_file), unsafe_allow_html=True)
     st.subheader("Generated PDF Files")
     pdf_files = sorted(list(OUTPUT_DIR.glob("*.pdf")), key=lambda p: p.stat().st_mtime, reverse=True)
     if not pdf_files:
         st.info("No PDFs generated yet. Click the button above to start.")
             with col2:
                 st.markdown(get_file_download_link(pdf_file), unsafe_allow_html=True)
 # --- Main App Execution ---
 def main():
     st.title("📄 Markdown to PDF Generator")
     st.markdown("This tool converts all `.md` files in this directory to PDF. It now supports emojis! 👍")
+    if not any(Path(".").glob("*.md")):
         with open("sample.md", "w", encoding="utf-8") as f:
             f.write("# Sample Document 👍\n\nThis is a sample markdown file. **ReportLab** is creating the PDF. Emojis like 🚀 and 💡 should now appear correctly.\n\n### Features\n- Item 1\n- Item 2\n\n```\ndef hello_world():\n    print(\"Hello, PDF! 👋\")\n```\n")
         st.rerun()
     pdf_generator = PDFGenerator(EMOJI_FONT_PATH)
     if st.button("🚀 Generate PDFs from all Markdown Files", type="primary"):
         markdown_files = list(Path(".").glob("*.md"))
         if not markdown_files:
             st.warning("No `.md` files found. Please add a markdown file to the directory.")
         else:
             total_pdfs = len(markdown_files) * len(LAYOUTS)
             progress_bar = st.progress(0, text="Starting PDF generation...")
             pdf_count = 0
             with st.spinner("Generating PDFs... Please wait."):
                 for md_file in markdown_files:
                     st.info(f"Processing: **{md_file.name}**")
                     for name, properties in LAYOUTS.items():
                         pdf_generator.create_pdf(md_file, name, properties)
                         pdf_count += 1
                         progress_bar.progress(pdf_count / total_pdfs, f"Generated {pdf_count}/{total_pdfs} PDFs...")
             st.success("✅ PDF generation complete!")
             st.balloons()
             st.rerun()
     display_file_explorer()
 if __name__ == "__main__":
     main()