# Song Cover Image Generator
#
# Gradio app: summarises the supplied song lyrics with Pegasus, renders a
# cover image with FLUX.1-schnell from the genre, song name and lyric summary,
# then draws the song and artist names on top of the image.

# built-in

from inspect import signature
import os
import subprocess
import logging
import re
import random
from string import ascii_letters, digits, punctuation
import requests
import sys
import warnings
import time
import asyncio
import math
from functools import partial

# external

import spaces
import torch
import gradio as gr
from lxml.html import fromstring
from huggingface_hub import hf_hub_download
from safetensors.torch import load_file, save_file
from diffusers import FluxPipeline
from PIL import Image, ImageDraw, ImageFont
from transformers import PegasusForConditionalGeneration, PegasusTokenizerFast

# logging

# Suppress Python warnings globally, then attach one stderr handler to the
# root logger so WARNING-and-above records are printed in a padded format.
warnings.filterwarnings("ignore")

formatter = logging.Formatter('\n >>> [%(levelname)s] %(asctime)s %(name)s: %(message)s\n')

handler = logging.StreamHandler(sys.stderr)
handler.setLevel(logging.WARN)
handler.setFormatter(formatter)

root = logging.getLogger()
root.setLevel(logging.WARN)
root.addHandler(handler)

# constant data

# Use the GPU when torch reports one, otherwise fall back to the CPU.
device = "cuda" if torch.cuda.is_available() else "cpu"

# Hugging Face model identifiers.
base = "black-forest-labs/FLUX.1-schnell"  # checkpoint loaded into the FLUX image pipeline
pegasus_name = "google/pegasus-xsum"       # same id that summarize_text spells out literally

# precision data

seq = 512         # passed to the image pipeline as max_sequence_length
width = 2160      # output image width in pixels; also used for the CSS aspect ratio
height = 2160     # output image height in pixels; also used for the CSS aspect ratio
image_steps = 8   # passed to the image pipeline as num_inference_steps
img_accu = 0      # passed to the image pipeline as guidance_scale

# ui data

# Stylesheet handed to gr.Blocks. The only dynamic part is the image
# container's aspect ratio, which is taken from the configured output size.
css = (
    """
input, input::placeholder {
    text-align: center !important;
}
*, *::placeholder {
    font-family: Suez One !important;
}
h1,h2,h3,h4,h5,h6 {
    width: 100%;
    text-align: center;
}
footer {
    display: none !important;
}
#col-container {
    margin: 0 auto;
}
.image-container {
    aspect-ratio: """
    f"{width}/{height}"
    """ !important;
}
.dropdown-arrow {
    display: none !important;
}
*:has(>.btn) {
    display: flex;
    justify-content: space-evenly;
    align-items: center;
}
.btn {
    display: flex;
}
"""
)

# Client-side input filter for two text inputs selected as "div#prompt input"
# and "div#prompt2 input". For each one, the value is snapshotted on keydown
# and restored on input whenever the new value contains a character other
# than a space, an ASCII letter or a comma, or contains two or more
# consecutive spaces/commas.
# NOTE(review): in the code visible in this file the string is never passed to
# gr.Blocks (only `theme` and `css` are), and no component sets elem_id
# "prompt" or "prompt2" — confirm whether this snippet is still meant to be used.
js="""
function custom(){
    document.querySelector("div#prompt input").addEventListener("keydown",function(e){
        e.target.setAttribute("last_value",e.target.value);
    });
    document.querySelector("div#prompt input").addEventListener("input",function(e){
        if( e.target.value.toString().match(/[^ a-zA-Z,]|( |,){2,}/gsm) ){
            e.target.value = e.target.getAttribute("last_value");
            e.target.removeAttribute("last_value");
        }
    });

    document.querySelector("div#prompt2 input").addEventListener("keydown",function(e){
        e.target.setAttribute("last_value",e.target.value);
    });
    document.querySelector("div#prompt2 input").addEventListener("input",function(e){
        if( e.target.value.toString().match(/[^ a-zA-Z,]|( |,){2,}/gsm) ){
            e.target.value = e.target.getAttribute("last_value");
            e.target.removeAttribute("last_value");
        }
    });
}
"""

# torch pipes

# Load the FLUX checkpoint in bfloat16, place it on the selected device and
# then switch on diffusers' model CPU offloading.
# NOTE(review): moving the pipeline to `device` and then enabling CPU offload
# may be redundant — confirm against the diffusers offloading guidance.
image_pipe = FluxPipeline.from_pretrained(base, torch_dtype=torch.bfloat16)
image_pipe = image_pipe.to(device)
image_pipe.enable_model_cpu_offload()

# functionality

@spaces.GPU(duration=70)
def summarize_text(
    text, max_length=30, num_beams=16, early_stopping=True,
    pegasus_tokenizer = PegasusTokenizerFast.from_pretrained("google/pegasus-xsum"),
    pegasus_model = PegasusForConditionalGeneration.from_pretrained("google/pegasus-xsum")
):
    """Return a short abstractive summary of *text* produced by Pegasus.

    The tokenizer and model defaults are evaluated once, when the function is
    defined, so the checkpoint is loaded at import time and reused by every
    call that does not pass its own.

    Args:
        text: The text to summarise.
        max_length: Forwarded to ``generate`` as ``max_length``.
        num_beams: Forwarded to ``generate`` as ``num_beams``.
        early_stopping: Forwarded to ``generate`` as ``early_stopping``.
        pegasus_tokenizer: Tokenizer used to encode *text* and decode the result.
        pegasus_model: Model whose ``generate`` method produces the summary.

    Returns:
        The decoded summary with special tokens removed, or ``""`` when *text*
        is empty or whitespace-only.
    """
    # Nothing to summarise: avoid asking the model to invent a sentence.
    if not text or not text.strip():
        return ""

    # truncation=True caps the encoded input at the tokenizer's maximum
    # length, so long lyrics no longer overflow the model's input limit.
    encoded = pegasus_tokenizer(text, truncation=True, return_tensors="pt")
    summary_ids = pegasus_model.generate(
        encoded.input_ids,
        max_length=max_length,
        num_beams=num_beams,
        early_stopping=early_stopping
    )
    return pegasus_tokenizer.decode(summary_ids[0], skip_special_tokens=True)

def generate_random_string(length):
    """Return *length* characters drawn at random from ASCII letters and digits."""
    alphabet = str(ascii_letters + digits)
    picked = [random.choice(alphabet) for _ in range(length)]
    return ''.join(picked)

@spaces.GPU(duration=140)
def pipe_generate(p1,p2):
    """Render one image with the module-level FLUX pipeline.

    Args:
        p1: Positive prompt.
        p2: Negative prompt, forwarded as ``negative_prompt``.
            NOTE(review): whether the pipeline honours it with
            ``guidance_scale=img_accu`` depends on the installed diffusers
            version — confirm.

    Returns:
        The first (and only) image of the pipeline output.
    """
    # Draw the seed directly as an integer. Parsing the digits after the
    # decimal point of str(random.random()) breaks whenever the float is
    # printed in scientific notation (e.g. "1.2e-05" or "1e-05").
    seed = random.randrange(2**63)
    generator = torch.Generator(device).manual_seed(seed)

    result = image_pipe(
        prompt=p1,
        negative_prompt=p2,
        height=height,
        width=width,
        guidance_scale=img_accu,
        num_images_per_prompt=1,
        num_inference_steps=image_steps,
        max_sequence_length=seq,
        generator=generator,
    )
    return result.images[0]

def _collapse_whitespace(text):
    """Collapse every run of spaces, tabs and newlines in *text* to one space."""
    return re.sub(r"[ \t\n]+", " ", text)


def _strip_punctuation(text):
    """Remove every ASCII punctuation character from *text*."""
    # re.escape keeps "\", "]", "^" and "-" literal inside the character class;
    # unescaped, the backslash only escaped the "]" and was never removed.
    return re.sub(f"[{re.escape(punctuation)}]", "", text)


def _draw_centered_label(draw, canvas_size, text, font_size, direction, rows=1, labels_distance=1):
    """Draw *text* in white, horizontally centred, above or below the middle.

    ``direction`` is -1 to shift the label up from the vertically centred
    position and +1 to shift it down; the shift is ``ceil(y / labels_distance)``.
    """
    canvas_width, canvas_height = canvas_size
    font = ImageFont.truetype(r"Alef-Bold.ttf", font_size)
    text_width = draw.textlength(text, font)
    x = math.ceil((canvas_width - text_width) / 2)
    y = math.ceil((canvas_height - math.ceil(font_size * rows / 2)) / 2)
    y = y + direction * math.ceil(y / labels_distance)
    draw.text((x, y), text, (255, 255, 255), font=font)


def handle_generate(artist,song,genre,lyrics):
    """Generate a cover image for a song and return the saved file's name.

    The inputs are normalised, the lyrics are summarised, an image is rendered
    from the genre, song name and lyric summary, and the song and artist names
    are drawn onto it.

    Args:
        artist: Artist name; drawn on the image, not part of the prompt.
        song: Song name; each word's first letter is upper-cased.
        genre: Genre; punctuation is stripped and the text upper-cased.
        lyrics: Lyrics; punctuation is stripped and the text lower-cased
            before summarisation.

    Returns:
        The file name of the PNG written via ``img.save`` (a random
        12-character name with a ``.png`` suffix, no directory part).
    """
    pos_artist = _collapse_whitespace(artist).strip()
    pos_song = _collapse_whitespace(song).strip()
    pos_song = ' '.join(word[0].upper() + word[1:] for word in pos_song.split())
    pos_genre = _strip_punctuation(_collapse_whitespace(genre)).upper().strip()
    pos_lyrics = _strip_punctuation(_collapse_whitespace(lyrics)).lower().strip()
    pos_lyrics_sum = summarize_text(pos_lyrics)
    neg = "Textual Labeled Distorted Discontinuous Ugly Blurry"
    pos = f'Realistic Natural Genuine Reasonable Detailed { pos_genre } GENRE { pos_song } "{ pos_lyrics_sum }"'

    print(f"""
        Positive: {pos}

        Negative: {neg}
    """)

    img = pipe_generate(pos,neg)
    draw = ImageDraw.Draw(img)
    canvas_width, canvas_height = img.size

    rows = 1
    # The original called the non-existent math.cail here and below, which
    # raised AttributeError on every request.
    # NOTE(review): ceil(1 / 3) is 1, so the song name lands at y == 0 and the
    # artist name at twice the centred y — confirm this is the intended layout.
    labels_distance = math.ceil(1 / 3)

    # Song name: larger font, shifted up from the centre.
    song_font_size = min(math.ceil(canvas_width / 10), math.ceil(canvas_height / 5))
    _draw_centered_label(draw, img.size, pos_song, song_font_size, -1, rows, labels_distance)

    # Artist name: smaller font, shifted down from the centre.
    artist_font_size = min(math.ceil(canvas_width / 12), math.ceil(canvas_height / 6))
    _draw_centered_label(draw, img.size, pos_artist, artist_font_size, +1, rows, labels_distance)

    name = generate_random_string(12) + ".png"
    img.save(name)
    return name

# entry

if __name__ == "__main__":
    # All four text inputs are container-less, single-line boxes that differ
    # only in their placeholder text.
    single_line_box = partial(gr.Textbox, container=False, max_lines=1)

    with gr.Blocks(theme=gr.themes.Citrus(),css=css) as demo:
        gr.Markdown(f"""
            # Song Cover Image Generator
        """)

        # First row: artist, song and genre side by side.
        with gr.Row():
            with gr.Column():
                artist = single_line_box(placeholder="Artist name")
            with gr.Column():
                song = single_line_box(placeholder="Song name")
            with gr.Column():
                genre = single_line_box(placeholder="Genre")

        # Second row: lyrics.
        with gr.Row():
            lyrics = single_line_box(placeholder="Lyrics (English)")

        with gr.Row():
            run = gr.Button("Generate",elem_classes="btn")

        # Result image; handle_generate returns a file path.
        with gr.Row():
            cover = gr.Image(
                interactive=False,
                container=False,
                elem_classes="image-container",
                label="Result",
                show_label=True,
                type='filepath',
                show_share_button=False,
            )

        form_inputs = [artist,song,genre,lyrics]
        run.click(fn=handle_generate, inputs=form_inputs, outputs=[cover])

    demo.queue().launch()

# end