FLUX-Open-Ghibli-Studio

Running on Zero

App Files Files Community

ginipick committed on Apr 2

Commit

1b3b25e

verified ·

1 Parent(s): a9938b5

Update app.py

Browse files

Files changed (1) hide show

app.py +150 -2

app.py CHANGED Viewed

@@ -161,6 +161,39 @@ def caption_image(image, model_name='gokaygokay/Florence-2-Flux-Large'):
     )
     return parsed_answer["<DESCRIPTION>"]
 # ----------------------------- Gradio UI --------------------------------------
 with gr.Blocks(analytics_enabled=False) as demo:
     with gr.Tabs():
@@ -264,7 +297,122 @@ with gr.Blocks(analytics_enabled=False) as demo:
                 inputs=[input_img, model_selector],
                 outputs=[caption_output]
             )
-# Just remove or simplify the queue call if needed:
-demo.launch(debug=True)

     )
     return parsed_answer["<DESCRIPTION>"]
+# --------- NEW FUNCTION: Process uploaded image and generate Ghibli style image ---------
+@spaces.GPU(duration=120)
+def process_uploaded_image(
+    image,
+    model_name,
+    seed,
+    randomize_seed,
+    width,
+    height,
+    guidance_scale,
+    num_inference_steps,
+    lora_scale
+):
+    # Step 1: Generate caption from the uploaded image
+    caption = caption_image(image, model_name)
+    # Step 2: Append "ghibli style" to the caption
+    ghibli_prompt = f"{caption}, ghibli style"
+    # Step 3: Generate Ghibli-style image based on the caption
+    generated_image, used_seed = inference(
+        prompt=ghibli_prompt,
+        seed=seed,
+        randomize_seed=randomize_seed,
+        width=width,
+        height=height,
+        guidance_scale=guidance_scale,
+        num_inference_steps=num_inference_steps,
+        lora_scale=lora_scale
+    )
+    return generated_image, used_seed, caption, ghibli_prompt
 # ----------------------------- Gradio UI --------------------------------------
 with gr.Blocks(analytics_enabled=False) as demo:
     with gr.Tabs():
                 inputs=[input_img, model_selector],
                 outputs=[caption_output]
             )
+        # ------------------ NEW TAB 3: Image to Ghibli Style ---------------------------
+        with gr.TabItem("이미지 to 지브리 스타일"):
+            gr.Markdown("## Upload an image and transform it to Ghibli style")
+            with gr.Row():
+                with gr.Column():
+                    upload_img = gr.Image(label="Upload an Image")
+                    caption_model_selector = gr.Dropdown(
+                        choices=list(models.keys()),
+                        value='gokaygokay/Florence-2-Flux-Large',
+                        label="Caption Model",
+                        visible=False  # Hidden as requested
+                    )
+                    with gr.Row():
+                        img2img_seed = gr.Slider(
+                            label="Seed",
+                            minimum=0,
+                            maximum=MAX_SEED,
+                            step=1,
+                            value=42
+                        )
+                        img2img_randomize_seed = gr.Checkbox(label="Randomize seed", value=True)
+                    with gr.Row():
+                        img2img_width = gr.Slider(
+                            label="Width",
+                            minimum=256,
+                            maximum=MAX_IMAGE_SIZE,
+                            step=32,
+                            value=512
+                        )
+                        img2img_height = gr.Slider(
+                            label="Height",
+                            minimum=256,
+                            maximum=MAX_IMAGE_SIZE,
+                            step=32,
+                            value=512
+                        )
+                    with gr.Row():
+                        img2img_guidance_scale = gr.Slider(
+                            label="Guidance scale",
+                            minimum=0.0,
+                            maximum=10.0,
+                            step=0.1,
+                            value=3.5
+                        )
+                        img2img_steps = gr.Slider(
+                            label="Steps",
+                            minimum=1,
+                            maximum=50,
+                            step=1,
+                            value=30
+                        )
+                    img2img_lora_scale = gr.Slider(
+                        label="LoRA scale",
+                        minimum=0.0,
+                        maximum=1.0,
+                        step=0.1,
+                        value=1.0
+                    )
+                    transform_button = gr.Button("Transform to Ghibli Style")
+                with gr.Column():
+                    ghibli_output_image = gr.Image(label="Generated Ghibli Image")
+                    ghibli_output_seed = gr.Number(label="Seed Used")
+                    extracted_caption = gr.Textbox(
+                        label="Extracted Description",
+                        visible=False  # Hidden as requested
+                    )
+                    ghibli_prompt = gr.Textbox(
+                        label="Generated Prompt",
+                        visible=False  # Hidden as requested
+                    )
+            # Auto-process when image is uploaded
+            upload_img.upload(
+                process_uploaded_image,
+                inputs=[
+                    upload_img,
+                    caption_model_selector,
+                    img2img_seed,
+                    img2img_randomize_seed,
+                    img2img_width,
+                    img2img_height,
+                    img2img_guidance_scale,
+                    img2img_steps,
+                    img2img_lora_scale,
+                ],
+                outputs=[
+                    ghibli_output_image,
+                    ghibli_output_seed,
+                    extracted_caption,
+                    ghibli_prompt,
+                ]
+            )
+            # Manual process button
+            transform_button.click(
+                process_uploaded_image,
+                inputs=[
+                    upload_img,
+                    caption_model_selector,
+                    img2img_seed,
+                    img2img_randomize_seed,
+                    img2img_width,
+                    img2img_height,
+                    img2img_guidance_scale,
+                    img2img_steps,
+                    img2img_lora_scale,
+                ],
+                outputs=[
+                    ghibli_output_image,
+                    ghibli_output_seed,
+                    extracted_caption,
+                    ghibli_prompt,
+                ]
+            )
+demo.launch(debug=True)