File size: 7,093 Bytes
4eeb4da
9b64245
8f38a6d
f7e2faa
 
8f38a6d
f7e2faa
9b64245
8f38a6d
 
 
 
 
 
 
 
 
 
 
 
30a1cae
8f38a6d
30a1cae
8f38a6d
30a1cae
f4892cf
9b64245
f7e2faa
f4892cf
f7e2faa
 
30a1cae
f4892cf
30a1cae
f7e2faa
30a1cae
f4892cf
f7e2faa
f4892cf
30a1cae
f7e2faa
 
30a1cae
 
 
 
 
 
f7e2faa
30a1cae
 
 
 
 
9b64245
30a1cae
 
9b64245
30a1cae
 
 
 
 
 
 
 
 
 
 
 
 
9b64245
30a1cae
f7e2faa
30a1cae
 
f7e2faa
30a1cae
 
9b64245
30a1cae
 
 
9b64245
 
30a1cae
 
 
 
 
 
 
 
 
 
 
 
12f8f41
30a1cae
 
 
12f8f41
30a1cae
 
 
f7e2faa
 
 
 
 
30a1cae
 
 
 
9763e73
30a1cae
 
f7e2faa
 
 
 
30a1cae
 
 
 
 
 
 
 
 
 
f7e2faa
30a1cae
 
 
 
 
9b64245
f7e2faa
 
 
 
 
8861022
f7e2faa
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8861022
f7e2faa
9b64245
 
 
30a1cae
 
 
 
 
f7e2faa
30a1cae
 
 
 
f7e2faa
 
 
30a1cae
 
9b64245
30a1cae
f4892cf
30a1cae
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
import os
import gradio as gr
from PIL import Image, ImageDraw, ImageFont
import base64
import io

# --- Image Generation Logic ---

def draw_horizontal_lines(draw, width, height, spacing=60, color=(230, 230, 230)):
    """Rule the canvas with full-width horizontal strokes.

    A 2px line is drawn at every multiple of ``spacing`` starting from the
    top edge (y = 0) and stopping before ``height``.
    """
    stroke_width = 2
    for row in range(0, height, spacing):
        left_end = (0, row)
        right_end = (width, row)
        draw.line([left_end, right_end], fill=color, width=stroke_width)

def draw_dot_grid(draw, width, height, spacing=50, color=(220, 220, 220)):
    """Stamp a regular grid of small filled dots onto the canvas.

    Dot centres sit at every (x, y) where both coordinates are multiples of
    ``spacing`` inside the ``width`` x ``height`` area; each dot is drawn as
    an ellipse extending 2px from its centre in every direction.
    """
    radius = 2
    # Column-major order: all rows of the first column, then the next column.
    centres = [
        (cx, cy)
        for cx in range(0, width, spacing)
        for cy in range(0, height, spacing)
    ]
    for cx, cy in centres:
        upper_left = (cx - radius, cy - radius)
        lower_right = (cx + radius, cy + radius)
        draw.ellipse([upper_left, lower_right], fill=color)

def draw_lattice_grid(draw, width, height, spacing=100, color=(235, 235, 235)):
    """Rule the canvas like graph paper.

    All vertical strokes are drawn first (one per multiple of ``spacing``
    across the width), followed by all horizontal strokes (one per multiple
    of ``spacing`` down the height). Every stroke is 2px wide.
    """
    def stroke(start, end):
        draw.line([start, end], fill=color, width=2)

    for column in range(0, width, spacing):
        stroke((column, 0), (column, height))
    for row in range(0, height, spacing):
        stroke((0, row), (width, row))


def _load_font(font_size):
    """Return the first loadable TrueType font at *font_size*, else PIL's default font."""
    font_paths_to_try = (
        "Arial.ttf", "arial.ttf", "DejaVuSans.ttf",
        "/System/Library/Fonts/Supplemental/Arial.ttf",
        "/usr/share/fonts/truetype/liberation/LiberationSans-Regular.ttf",
        "/usr/share/fonts/truetype/dejavu/DejaVuSans.ttf",
    )
    try:
        for f_path in font_paths_to_try:
            try:
                return ImageFont.truetype(f_path, font_size)
            except OSError:
                # Font file not present on this system; try the next candidate.
                continue
    except Exception as e:
        # Best-effort: any unexpected loader failure falls back to the default font.
        print(f"Font loading error: {e}")
    return ImageFont.load_default()


def _wrap_paragraph(paragraph, font, max_width):
    """Greedily wrap one paragraph into lines no wider than *max_width* pixels."""
    lines = []
    current_line = ""
    for word in paragraph.split():
        if font.getlength(word) > max_width:
            # The word alone cannot fit on a line. Flush whatever is pending
            # first so the split chunks are emitted in reading order.
            if current_line:
                lines.append(current_line)
                current_line = ""
            chunk = ""
            for char in word:
                # `chunk and` avoids emitting an empty line when even a single
                # character is wider than the drawable area.
                if chunk and font.getlength(chunk + char) > max_width:
                    lines.append(chunk)
                    chunk = char
                else:
                    chunk += char
            word = chunk  # the tail continues as a normal word

        # Measure without a leading space when the line is still empty, so a
        # word that exactly fits is not pushed down behind a blank line.
        candidate = f"{current_line} {word}" if current_line else word
        if font.getlength(candidate) <= max_width:
            current_line = candidate
        else:
            if current_line:
                lines.append(current_line)
            current_line = word
    if current_line:
        lines.append(current_line)
    return lines


def text_to_base64_images_generator(text_content, style='lines'):
    """
    Converts text into a series of images and returns them as a list
    of base64 encoded strings, suitable for an API/MCP client.

    The text is split into paragraphs on newlines (blank paragraphs are
    dropped), word-wrapped to fit a 1080x1080 canvas with 80px padding, and
    paginated onto as many images as needed. Words wider than the drawable
    area are broken across lines character by character.

    Args:
        text_content (str): The text to be converted.
        style (str, optional): The background style ('plain', 'lines', 'dots', 'grid').
            Any value other than 'lines', 'dots' or 'grid' yields a plain background.

    Returns:
        list: A list of base64 encoded PNG image strings. Empty when the
        input is empty or whitespace-only (a Gradio warning is issued).
    """
    if not text_content or not text_content.strip():
        gr.Warning("Input text is empty. Please enter some text to generate images.")
        return []

    # --- Configuration ---
    IMG_WIDTH = 1080
    IMG_HEIGHT = 1080
    BACKGROUND_COLOR = (255, 255, 255)
    TEXT_COLOR = (10, 10, 10)
    STYLE_COLOR = (225, 225, 225)

    PADDING_X = 80
    PADDING_Y = 80
    FONT_SIZE = 48
    LINE_SPACING = 20

    # --- Font Loading ---
    font = _load_font(FONT_SIZE)

    # --- Text Wrapping ---
    drawable_width = IMG_WIDTH - 2 * PADDING_X
    paragraphs = [p.strip() for p in text_content.strip().split('\n') if p.strip()]

    # Flat sequence of text lines; `None` marks a paragraph break.
    all_lines_and_breaks = []
    for i, paragraph in enumerate(paragraphs):
        if i:
            all_lines_and_breaks.append(None)
        all_lines_and_breaks.extend(_wrap_paragraph(paragraph, font, drawable_width))

    # --- Line Metrics ---
    try:
        bbox = font.getbbox("A")
        line_height = bbox[3] - bbox[1]
    except AttributeError:
        # Font object without getbbox(): fall back to a fixed height.
        line_height = 12

    PARAGRAPH_SPACING = line_height

    def create_and_encode_page(content):
        """Render one page of lines/breaks and return it as a base64 PNG string."""
        img = Image.new('RGB', (IMG_WIDTH, IMG_HEIGHT), color=BACKGROUND_COLOR)
        draw = ImageDraw.Draw(img)

        if style == 'lines':
            # Rule spacing follows the text line pitch.
            line_style_spacing = line_height + LINE_SPACING
            draw_horizontal_lines(draw, IMG_WIDTH, IMG_HEIGHT, spacing=line_style_spacing, color=STYLE_COLOR)
        elif style == 'dots':
            draw_dot_grid(draw, IMG_WIDTH, IMG_HEIGHT, color=STYLE_COLOR)
        elif style == 'grid':
            draw_lattice_grid(draw, IMG_WIDTH, IMG_HEIGHT, color=STYLE_COLOR)

        current_y = PADDING_Y
        for page_item in content:
            if page_item is not None:
                draw.text((PADDING_X, current_y), page_item, font=font, fill=TEXT_COLOR)
                current_y += line_height + LINE_SPACING
            else:
                current_y += PARAGRAPH_SPACING

        # Encode image to base64 string
        buffered = io.BytesIO()
        img.save(buffered, format="PNG")
        return base64.b64encode(buffered.getvalue()).decode("utf-8")

    # --- Page Creation Loop ---
    generated_base64_list = []
    page_content = []
    y_text = PADDING_Y

    for item in all_lines_and_breaks:
        is_break = item is None
        item_height = PARAGRAPH_SPACING if is_break else line_height
        advance = item_height + (0 if is_break else LINE_SPACING)

        if y_text + item_height > IMG_HEIGHT - PADDING_Y:
            # Item would cross the bottom margin: emit the page and start a new one.
            generated_base64_list.append(create_and_encode_page(page_content))
            page_content = [item]
            y_text = PADDING_Y + advance
        else:
            page_content.append(item)
            y_text += advance

    if page_content:
        generated_base64_list.append(create_and_encode_page(page_content))

    return generated_base64_list

# --- Gradio Interface ---

# Sample two-paragraph text pre-filled into the input box.
example_text = """In the heart of a bustling city, there lived a clockmaker named Alistair. His shop, a quaint corner of tranquility amidst the urban chaos, was filled with the gentle ticking of countless timepieces. Each clock was a masterpiece, a testament to his dedication and skill.

One day, a young girl with eyes as curious as a cat's wandered into his shop. She wasn't interested in the shiny new watches but was drawn to the grandfather clock in the corner. "What's its story?" she asked, her voice soft. Alistair smiled, for he knew he had found the next guardian of the stories. The legacy of the whispering clock would live on."""

# Two inputs (text + background style) mapped positionally onto
# text_to_base64_images_generator; the returned list is shown as JSON.
demo = gr.Interface(
    fn=text_to_base64_images_generator,
    inputs=[
        gr.Textbox(lines=15, label="Text Content", placeholder="Paste your long-form text here...", value=example_text),
        gr.Radio(['lines', 'dots', 'grid', 'plain'], label="Background Style", value='lines')
    ],
    outputs=gr.JSON(label="Base64 Encoded Images"),
    title="Text-to-Image API Server",
    description="Transforms long-form text into a series of images and returns a JSON list of base64-encoded strings.",
    # `allow_flagging` is deprecated in Gradio 5 (the version line that
    # provides `launch(mcp_server=True)`); `flagging_mode` is its replacement.
    flagging_mode="never",
)

# --- Main Execution ---
if __name__ == "__main__":
    # Launch with the MCP server option enabled alongside the web UI.
    demo.launch(mcp_server=True)