Spaces:

ginigen
/

Book-Cover

Running on Zero

App Files Files Community

ginipick committed 16 days ago

Commit

90456d7

verified ·

1 Parent(s): 289e506

Update app.py

Browse files

Files changed (1) hide show

app.py +132 -52

app.py CHANGED Viewed

@@ -86,56 +86,115 @@ def augment_prompt_with_llm(prompt):
         print(f"Error calling LLM API: {e}")
         return prompt
-def add_text_overlay(image, title_ko, title_en, author_ko, author_en,
-                    title_position, author_position, text_color):
-    """Add text overlay to the generated image"""
     # Create a copy of the image to work with
     img_with_text = image.copy()
     draw = ImageDraw.Draw(img_with_text)
-    # Try to load a better font, fallback to default if not available
-    try:
-        # You may need to adjust the font path based on your system
-        title_font_size = 48
-        author_font_size = 32
-        # For production, you'd want to include proper font files
-        title_font = ImageFont.truetype("/usr/share/fonts/truetype/liberation/LiberationSans-Bold.ttf", title_font_size)
-        author_font = ImageFont.truetype("/usr/share/fonts/truetype/liberation/LiberationSans-Regular.ttf", author_font_size)
-    except:
-        # Fallback to default font
-        title_font = ImageFont.load_default()
-        author_font = ImageFont.load_default()
     # Get image dimensions
     img_width, img_height = img_with_text.size
     # Define position mappings
     position_coords = {
-        "Top": (img_width // 2, img_height // 10),
-        "Center": (img_width // 2, img_height // 2),
-        "Bottom": (img_width // 2, img_height * 9 // 10)
     }
-    # Draw title
-    if title_ko or title_en:
-        title_text = f"{title_ko}\n{title_en}" if title_ko and title_en else title_ko or title_en
         title_x, title_y = position_coords[title_position]
         # Get text bbox for centering
-        bbox = draw.textbbox((0, 0), title_text, font=title_font)
         text_width = bbox[2] - bbox[0]
         text_height = bbox[3] - bbox[1]
         # Draw text with shadow for better visibility
         shadow_offset = 2
         draw.text((title_x - text_width // 2 + shadow_offset, title_y - text_height // 2 + shadow_offset),
-                 title_text, font=title_font, fill="black", align="center")
         draw.text((title_x - text_width // 2, title_y - text_height // 2),
-                 title_text, font=title_font, fill=text_color, align="center")
-    # Draw author
-    if author_ko or author_en:
-        author_text = f"{author_ko}\n{author_en}" if author_ko and author_en else author_ko or author_en
         author_x, author_y = position_coords[author_position]
         # Get text bbox for centering
@@ -145,9 +204,9 @@ def add_text_overlay(image, title_ko, title_en, author_ko, author_en,
         # Draw text with shadow
         draw.text((author_x - text_width // 2 + shadow_offset, author_y - text_height // 2 + shadow_offset),
-                 author_text, font=author_font, fill="black", align="center")
         draw.text((author_x - text_width // 2, author_y - text_height // 2),
-                 author_text, font=author_font, fill=text_color, align="center")
     return img_with_text
@@ -194,12 +253,13 @@ def inference(
     num_inference_steps: int,
     lora_scale: float,
     title_ko: str,
-    title_en: str,
     author_ko: str,
-    author_en: str,
     title_position: str,
     author_position: str,
     text_color: str,
     progress: gr.Progress = gr.Progress(track_tqdm=True),
 ):
     if randomize_seed:
@@ -216,10 +276,11 @@ def inference(
         joint_attention_kwargs={"scale": lora_scale},
     ).images[0]
-    # Add text overlay if any text is provided
-    if any([title_ko, title_en, author_ko, author_en]):
-        image = add_text_overlay(image, title_ko, title_en, author_ko, author_en,
-                               title_position, author_position, text_color)
     # Save the generated image
     filepath = save_generated_image(image, prompt)
@@ -278,29 +339,47 @@ with gr.Blocks(theme=gr.themes.Soft(), analytics_enabled=False) as demo:
                     value=DEFAULT_IMAGE_PATH  # Set the default image
                 )
-                with gr.Accordion("Text Overlay Settings", open=False):
                     with gr.Row():
                         with gr.Column():
-                            title_ko = gr.Textbox(label="Title (Korean)", placeholder="한글 제목")
-                            title_en = gr.Textbox(label="Title (English)", placeholder="English Title")
                             title_position = gr.Radio(
-                                label="Title Position",
-                                choices=["Top", "Center", "Bottom"],
-                                value="Top"
                             )
                         with gr.Column():
-                            author_ko = gr.Textbox(label="Author (Korean)", placeholder="지은이")
-                            author_en = gr.Textbox(label="Author (English)", placeholder="Author Name")
                             author_position = gr.Radio(
-                                label="Author Position",
-                                choices=["Top", "Center", "Bottom"],
-                                value="Bottom"
                             )
-                    text_color = gr.ColorPicker(
-                        label="Text Color",
-                        value="#FFFFFF"
-                    )
                 with gr.Accordion("Advanced Settings", open=False):
                     seed = gr.Slider(
@@ -412,12 +491,13 @@ with gr.Blocks(theme=gr.themes.Soft(), analytics_enabled=False) as demo:
             num_inference_steps,
             lora_scale,
             title_ko,
-            title_en,
             author_ko,
-            author_en,
             title_position,
             author_position,
             text_color,
         ],
         outputs=[result, seed, generated_gallery],
     )

         print(f"Error calling LLM API: {e}")
         return prompt
+def get_korean_font(font_name, font_size):
+    """Get Korean font based on font name"""
+    font_paths = {
+        "나눔고딕": [
+            "/usr/share/fonts/truetype/nanum/NanumGothic.ttf",
+            "NanumGothic.ttf",
+            "/System/Library/Fonts/AppleSDGothicNeo.ttc",  # macOS
+            "C:/Windows/Fonts/NanumGothic.ttf",  # Windows
+        ],
+        "나눔명조": [
+            "/usr/share/fonts/truetype/nanum/NanumMyeongjo.ttf",
+            "NanumMyeongjo.ttf",
+            "C:/Windows/Fonts/NanumMyeongjo.ttf",  # Windows
+        ],
+        "맑은 고딕": [
+            "/usr/share/fonts/truetype/malgun/malgun.ttf",
+            "malgun.ttf",
+            "/System/Library/Fonts/AppleMyungjo.ttf",  # macOS
+            "C:/Windows/Fonts/malgun.ttf",  # Windows
+        ],
+        "바탕": [
+            "/usr/share/fonts/truetype/batang/batang.ttf",
+            "batang.ttf",
+            "C:/Windows/Fonts/batang.ttc",  # Windows
+        ],
+        "돋움": [
+            "/usr/share/fonts/truetype/dotum/dotum.ttf",
+            "dotum.ttf",
+            "C:/Windows/Fonts/dotum.ttc",  # Windows
+        ],
+        "기본": []
+    }
+    # Try to load the selected font
+    if font_name in font_paths:
+        for font_path in font_paths[font_name]:
+            try:
+                return ImageFont.truetype(font_path, font_size)
+            except:
+                continue
+    # Try common font directories
+    common_paths = [
+        f"/usr/share/fonts/truetype/{font_name.lower()}/{font_name}.ttf",
+        f"fonts/{font_name}.ttf",
+        f"{font_name}.ttf",
+    ]
+    for path in common_paths:
+        try:
+            return ImageFont.truetype(path, font_size)
+        except:
+            continue
+    # Fallback to default font with larger size
+    try:
+        return ImageFont.truetype("DejaVuSans.ttf", font_size)
+    except:
+        # Use default font but try to make it larger
+        default = ImageFont.load_default()
+        # PIL default font is very small, so we might need to scale the text
+        return default
+def add_text_overlay(image, title_ko, author_ko,
+                    title_position, author_position, text_color, font_name,
+                    title_size, author_size):
+    """Add Korean text overlay to the generated image"""
     # Create a copy of the image to work with
     img_with_text = image.copy()
     draw = ImageDraw.Draw(img_with_text)
+    # Load Korean fonts with custom sizes
+    title_font = get_korean_font(font_name, title_size)
+    author_font = get_korean_font(font_name, author_size)
     # Get image dimensions
     img_width, img_height = img_with_text.size
     # Define position mappings
     position_coords = {
+        "상단": (img_width // 2, img_height // 10),
+        "중앙": (img_width // 2, img_height // 2),
+        "하단": (img_width // 2, img_height * 9 // 10)
     }
+    # Draw title (Korean only)
+    if title_ko:
         title_x, title_y = position_coords[title_position]
         # Get text bbox for centering
+        bbox = draw.textbbox((0, 0), title_ko, font=title_font)
         text_width = bbox[2] - bbox[0]
         text_height = bbox[3] - bbox[1]
         # Draw text with shadow for better visibility
         shadow_offset = 2
         draw.text((title_x - text_width // 2 + shadow_offset, title_y - text_height // 2 + shadow_offset),
+                 title_ko, font=title_font, fill="black")
         draw.text((title_x - text_width // 2, title_y - text_height // 2),
+                 title_ko, font=title_font, fill=text_color)
+    # Draw author (Korean only)
+    if author_ko:
+        # Add "지은이: " prefix if not already present
+        if not author_ko.startswith("지은이"):
+            author_text = f"지은이: {author_ko}"
+        else:
+            author_text = author_ko
         author_x, author_y = position_coords[author_position]
         # Get text bbox for centering
         # Draw text with shadow
         draw.text((author_x - text_width // 2 + shadow_offset, author_y - text_height // 2 + shadow_offset),
+                 author_text, font=author_font, fill="black")
         draw.text((author_x - text_width // 2, author_y - text_height // 2),
+                 author_text, font=author_font, fill=text_color)
     return img_with_text
     num_inference_steps: int,
     lora_scale: float,
     title_ko: str,
     author_ko: str,
     title_position: str,
     author_position: str,
     text_color: str,
+    font_name: str,
+    title_size: int,
+    author_size: int,
     progress: gr.Progress = gr.Progress(track_tqdm=True),
 ):
     if randomize_seed:
         joint_attention_kwargs={"scale": lora_scale},
     ).images[0]
+    # Add text overlay if any Korean text is provided
+    if title_ko or author_ko:
+        image = add_text_overlay(image, title_ko, author_ko,
+                               title_position, author_position, text_color, font_name,
+                               title_size, author_size)
     # Save the generated image
     filepath = save_generated_image(image, prompt)
                     value=DEFAULT_IMAGE_PATH  # Set the default image
                 )
+                with gr.Accordion("Text Overlay Settings (한글)", open=False):
                     with gr.Row():
                         with gr.Column():
+                            title_ko = gr.Textbox(label="제목", placeholder="한글 제목을 입력하세요")
                             title_position = gr.Radio(
+                                label="제목 위치",
+                                choices=["상단", "중앙", "하단"],
+                                value="상단"
+                            )
+                            title_size = gr.Slider(
+                                label="제목 글자 크기",
+                                minimum=20,
+                                maximum=100,
+                                value=48,
+                                step=2
                             )
                         with gr.Column():
+                            author_ko = gr.Textbox(label="지은이", placeholder="지은이 이름을 입력하세요")
                             author_position = gr.Radio(
+                                label="지은이 위치",
+                                choices=["상단", "중앙", "하단"],
+                                value="하단"
+                            )
+                            author_size = gr.Slider(
+                                label="지은이 글자 크기",
+                                minimum=16,
+                                maximum=60,
+                                value=32,
+                                step=2
                             )
+                    with gr.Row():
+                        font_name = gr.Dropdown(
+                            label="폰트 선택",
+                            choices=["나눔고딕", "나눔명조", "맑은 고딕", "바탕", "돋움", "기본"],
+                            value="나눔고딕"
+                        )
+                        text_color = gr.ColorPicker(
+                            label="글자 색상",
+                            value="#FFFFFF"
+                        )
                 with gr.Accordion("Advanced Settings", open=False):
                     seed = gr.Slider(
             num_inference_steps,
             lora_scale,
             title_ko,
             author_ko,
             title_position,
             author_position,
             text_color,
+            font_name,
+            title_size,
+            author_size,
         ],
         outputs=[result, seed, generated_gallery],
     )