flxgif

Running on Zero

App Files Files Community

aiqtech commited on 2 days ago

Commit

856ab89

verified ·

1 Parent(s): 28192a4

Update app.py

Browse files

Files changed (1) hide show

app.py +115 -63

app.py CHANGED Viewed

@@ -8,110 +8,162 @@ from PIL import Image
 from diffusers.utils import export_to_gif
 from transformers import pipeline
-HEIGHT = 256
-WIDTH = 1024
 MAX_SEED = np.iinfo(np.int32).max
 device = "cuda" if torch.cuda.is_available() else "cpu"
-pipe = FluxPipeline.from_pretrained(
-    "black-forest-labs/FLUX.1-dev",
-    torch_dtype=torch.bfloat16
-).to(device)
 translator = pipeline("translation", model="Helsinki-NLP/opus-mt-ko-en")
-def split_image(input_image, num_splits=4):
-    output_images = []
-    for i in range(num_splits):
-        left = i * 256
-        right = (i + 1) * 256
-        box = (left, 0, right, 256)
-        output_images.append(input_image.crop(box))
-    return output_images
-def translate_to_english(text):
-    return translator(text)[0]['translation_text']
 @spaces.GPU()
-def predict(prompt, seed=42, randomize_seed=False, guidance_scale=5.0, num_inference_steps=28, progress=gr.Progress(track_tqdm=True)):
-    if any('\u3131' <= char <= '\u318E' or '\uAC00' <= char <= '\uD7A3' for char in prompt):
         prompt = translate_to_english(prompt)
-    prompt_template = f"""
-    A side by side 4 frame image showing consecutive stills from a looped gif moving from left to right. The gif is of {prompt}.
-    """
     if randomize_seed:
         seed = random.randint(0, MAX_SEED)
     image = pipe(
         prompt=prompt_template,
         guidance_scale=guidance_scale,
         num_inference_steps=num_inference_steps,
         num_images_per_prompt=1,
-        generator=torch.Generator("cpu").manual_seed(seed),
-        height=HEIGHT,
-        width=WIDTH
     ).images[0]
-    return export_to_gif(split_image(image, 4), "flux.gif", fps=4), image, seed
 css = """
-footer { visibility: hidden;}
 """
 examples = [
-    "고양이가 공중에서 발을 흔드는 모습",
-    "팬더가 엉덩이를 좌우로 흔드는 모습",
-    "꽃이 피어나는 과정"
 ]
 with gr.Blocks(theme="soft", css=css) as demo:
     with gr.Column(elem_id="col-container"):
         with gr.Row():
-            prompt = gr.Text(label="프롬프트", show_label=False, max_lines=1, placeholder="프롬프트를 입력하세요")
-            submit = gr.Button("제출", scale=0)
-        output = gr.Image(label="GIF", show_label=False)
-        output_stills = gr.Image(label="스틸 이미지", show_label=False, elem_id="stills")
-        with gr.Accordion("고급 설정", open=False):
-            seed = gr.Slider(
-                label="시드",
-                minimum=0,
-                maximum=MAX_SEED,
-                step=1,
-                value=0,
             )
-            randomize_seed = gr.Checkbox(label="시드 무작위화", value=True)
             with gr.Row():
                 guidance_scale = gr.Slider(
-                    label="가이던스 스케일",
-                    minimum=1,
-                    maximum=15,
-                    step=0.1,
-                    value=3.5,
                 )
                 num_inference_steps = gr.Slider(
-                    label="추론 단계 수",
-                    minimum=1,
-                    maximum=50,
-                    step=1,
-                    value=28,
                 )
         gr.Examples(
             examples=examples,
             fn=predict,
             inputs=[prompt],
-            outputs=[output, output_stills, seed],
-            cache_examples="lazy"
         )
         gr.on(
             triggers=[submit.click, prompt.submit],
             fn=predict,
-            inputs=[prompt, seed, randomize_seed, guidance_scale, num_inference_steps],
-            outputs=[output, output_stills, seed]
         )
-demo.launch()

 from diffusers.utils import export_to_gif
 from transformers import pipeline
+# -------------------------
+# Configuration constants
+# -------------------------
+FRAMES = 4                      # number of stills laid out horizontally
+DEFAULT_HEIGHT = 256            # per‑frame size (px)
+DEFAULT_FPS = 8                 # smoother playback than the original 4 fps
 MAX_SEED = np.iinfo(np.int32).max
+# -------------------------
+# Model initialisation
+# -------------------------
 device = "cuda" if torch.cuda.is_available() else "cpu"
+pipe = (
+    FluxPipeline.from_pretrained(
+        "black-forest-labs/FLUX.1-dev",
+        torch_dtype=torch.float16,      # slightly higher precision than bfloat16 for crisper output
+    )
+    .to(device)
+)
+# English is the primary UI language, but Korean prompts are still accepted & translated.
 translator = pipeline("translation", model="Helsinki-NLP/opus-mt-ko-en")
+# -------------------------
+# Helper functions
+# -------------------------
+def split_image(input_image: Image.Image, frame_size: int) -> list[Image.Image]:
+    """Cut a wide strip into equal square frames."""
+    return [
+        input_image.crop((i * frame_size, 0, (i + 1) * frame_size, frame_size))
+        for i in range(FRAMES)
+    ]
+def translate_to_english(text: str) -> str:
+    """Translate Korean text to English if necessary."""
+    return translator(text)[0]["translation_text"]
 @spaces.GPU()
+def predict(
+    prompt: str,
+    seed: int = 42,
+    randomize_seed: bool = False,
+    guidance_scale: float = 7.0,
+    num_inference_steps: int = 40,
+    height: int = DEFAULT_HEIGHT,
+    fps: int = DEFAULT_FPS,
+    progress: gr.Progress = gr.Progress(track_tqdm=True),
+):
+    # 1) Language handling
+    if any("\u3131" <= ch <= "\u318E" or "\uAC00" <= ch <= "\uD7A3" for ch in prompt):
         prompt = translate_to_english(prompt)
+    # 2) Prompt template
+    prompt_template = (
+        f"A side-by-side {FRAMES} frame image showing consecutive stills from a looped gif moving left to right. "
+        f"The gif is of {prompt}."
+    )
+    # 3) Seed control
     if randomize_seed:
         seed = random.randint(0, MAX_SEED)
+    width = FRAMES * height  # maintain square frames
+    # 4) Generation
     image = pipe(
         prompt=prompt_template,
         guidance_scale=guidance_scale,
         num_inference_steps=num_inference_steps,
         num_images_per_prompt=1,
+        generator=torch.Generator(device).manual_seed(seed),
+        height=height,
+        width=width,
     ).images[0]
+    # 5) Assemble gif
+    gif_path = export_to_gif(split_image(image, height), "flux.gif", fps=fps)
+    return gif_path, image, seed
+# -------------------------
+# Interface
+# -------------------------
 css = """
+#col-container {max-width: 820px; margin: 0 auto;}
+footer {visibility: hidden;}
 """
 examples = [
+    "cat lazily swinging its paws in mid-air",
+    "panda shaking its hips",
+    "flower blooming in timelapse",
 ]
 with gr.Blocks(theme="soft", css=css) as demo:
+    gr.Markdown("<h1 style='text-align:center'>FLUX GIF Generator</h1>")
     with gr.Column(elem_id="col-container"):
+        # Prompt row
         with gr.Row():
+            prompt = gr.Text(
+                label="", show_label=False, max_lines=1, placeholder="Enter your prompt here…"
             )
+            submit = gr.Button("Generate", scale=0)
+        # Outputs
+        output_gif = gr.Image(label="", show_label=False)
+        output_stills = gr.Image(label="", show_label=False, elem_id="stills")
+        # Advanced controls
+        with gr.Accordion("Advanced settings", open=False):
+            seed = gr.Slider(label="Seed", minimum=0, maximum=MAX_SEED, step=1, value=0)
+            randomize_seed = gr.Checkbox(label="Randomize seed", value=True)
             with gr.Row():
                 guidance_scale = gr.Slider(
+                    label="Guidance scale", minimum=1, maximum=15, step=0.1, value=7.0
                 )
                 num_inference_steps = gr.Slider(
+                    label="Inference steps", minimum=10, maximum=60, step=1, value=40
                 )
+            with gr.Row():
+                height = gr.Slider(
+                    label="Frame size (px)", minimum=256, maximum=512, step=64, value=DEFAULT_HEIGHT
+                )
+                fps = gr.Slider(
+                    label="GIF FPS", minimum=4, maximum=20, step=1, value=DEFAULT_FPS
+                )
+        # Example prompts
         gr.Examples(
             examples=examples,
             fn=predict,
             inputs=[prompt],
+            outputs=[output_gif, output_stills, seed],
+            cache_examples="lazy",
         )
+        # Event wiring
         gr.on(
             triggers=[submit.click, prompt.submit],
             fn=predict,
+            inputs=[
+                prompt,
+                seed,
+                randomize_seed,
+                guidance_scale,
+                num_inference_steps,
+                height,
+                fps,
+            ],
+            outputs=[output_gif, output_stills, seed],
         )
+demo.launch()