Spaces:

vvaibhav
/

inpainting_background_swapper

Runtime error

App Files Files Community

vvaibhav committed on Jan 15

Commit

a99346b

verified ·

1 Parent(s): 19001b5

Update app.py

Browse files

Files changed (1) hide show

app.py +207 -53

app.py CHANGED Viewed

@@ -1,12 +1,14 @@
 # app.py
 import gradio as gr
-from PIL import Image
 import torch
 import numpy as np
 from transformers import SamModel, SamProcessor
 from diffusers import StableDiffusionInpaintPipeline
-import io
 # Initialize SAM model and processor on CPU
 sam_model = SamModel.from_pretrained("facebook/sam-vit-huge", torch_dtype=torch.float32).to("cpu")
@@ -19,6 +21,10 @@ inpaint_pipeline = StableDiffusionInpaintPipeline.from_pretrained(
 ).to("cpu")
 # No need for model_cpu_offload on CPU
 def mask_to_rgba(mask):
     """
     Converts a binary mask to an RGBA image for visualization.
@@ -126,70 +132,218 @@ def visualize_mask(image, mask):
     overlay = Image.alpha_composite(image.convert("RGBA"), mask_pil)
     return overlay.convert("RGB")
-def process(image, points, prompt, negative_prompt, seed, guidance_scale):
     """
-    Processes the image by replacing the selected object based on the prompt.
     Args:
-        image (PIL.Image): Uploaded image.
-        points (list of lists): Points selected on the image.
-        prompt (str): Text prompt for replacement.
-        negative_prompt (str): Negative text prompt.
-        seed (int): Seed for reproducibility.
-        guidance_scale (float): Guidance scale.
     Returns:
-        Tuple of images: Original with mask overlay and augmented image.
     """
-    mask = generate_mask(image, points)
-    masked_image = visualize_mask(image, mask)
-    augmented_image = replace_object(image, mask, prompt, negative_prompt, seed, guidance_scale)
-    return masked_image, augmented_image
-# Define Gradio Interface
-with gr.Blocks() as demo:
-    gr.Markdown("# Object Replacement App")
-    gr.Markdown(
-        """
-        Upload an image, select points on the object you want to replace, provide a text prompt for the replacement, and view the augmented image.
-        """
-    )
-    with gr.Row():
-        with gr.Column():
-            image_input = gr.Image(label="Upload Image", type="pil", interactive=True, elem_id="image")
-            points_input = gr.Points(
-                label="Select Points on the Object",
-                show_label=True,
-                source="image",  # Links Points to the Image component via elem_id
-                interactive=True
-            )
-            prompt_input = gr.Textbox(label="Replacement Prompt", placeholder="e.g., a red sports car", lines=2)
-            negative_prompt_input = gr.Textbox(label="Negative Prompt", placeholder="e.g., blurry, low quality", lines=2)
-            seed_input = gr.Number(label="Seed", value=42)
-            guidance_scale_input = gr.Slider(label="Guidance Scale", minimum=1, maximum=20, value=7.5)
-            process_button = gr.Button("Replace Object")
-        with gr.Column():
-            masked_output = gr.Image(label="Selected Object Mask Overlay")
-            augmented_output = gr.Image(label="Augmented Image")
-    # Bind the process function to the button click
-    process_button.click(
-        fn=process,
-        inputs=[image_input, points_input, prompt_input, negative_prompt_input, seed_input, guidance_scale_input],
-        outputs=[masked_output, augmented_output]
-    )
-    gr.Markdown(
         """
         **Instructions:**
-        1. **Upload Image:** Upload the image containing the object you want to replace.
-        2. **Select Points:** Click on the image to select points on the object. Use multiple points for better mask accuracy.
         3. **Enter Prompts:** Provide a replacement prompt and optionally a negative prompt to refine the output.
         4. **Adjust Settings:** Set the seed for reproducibility and adjust the guidance scale as needed.
         5. **Replace Object:** Click the "Replace Object" button to generate the augmented image.
-        """
-    )
 # Launch the app
-demo.launch()

 # app.py
 import gradio as gr
+from PIL import Image, ImageDraw
 import torch
 import numpy as np
 from transformers import SamModel, SamProcessor
 from diffusers import StableDiffusionInpaintPipeline
+# Constants
+IMG_SIZE = 512
 # Initialize SAM model and processor on CPU
 sam_model = SamModel.from_pretrained("facebook/sam-vit-huge", torch_dtype=torch.float32).to("cpu")
 ).to("cpu")
 # No need for model_cpu_offload on CPU
+# Global variables to store points and the original image
+input_points = []
+input_image = None
 def mask_to_rgba(mask):
     """
     Converts a binary mask to an RGBA image for visualization.
     overlay = Image.alpha_composite(image.convert("RGBA"), mask_pil)
     return overlay.convert("RGB")
+def get_points(img, evt: gr.SelectData):
     """
+    Registers a click on the image and refreshes the SAM mask preview.
     Args:
+        img (PIL.Image): Image passed in by the select event; crossmarks are drawn onto it.
+        evt (gr.SelectData): Select event; evt.index[0] and evt.index[1] are used as the x and y of the click.
     Returns:
+        Tuple: (Mask overlay rendered on the stored original image, img with a green cross at every stored point)
     """
+    global input_points, input_image
+    # An empty point list means nothing has been drawn yet: keep a clean copy of the image
+    if not input_points:
+        input_image = img.copy()
+    input_points.append([evt.index[0], evt.index[1]])
+    # Segment on the clean copy using every point collected so far
+    mask = generate_mask(input_image, input_points)
+    # Draw a green cross (one horizontal and one vertical stroke) at each collected point
+    arm = 10
+    canvas = ImageDraw.Draw(img)
+    for cx, cy in input_points:
+        canvas.line((cx - arm, cy, cx + arm, cy), fill="green", width=5)
+        canvas.line((cx, cy - arm, cx, cy + arm), fill="green", width=5)
+    # The overlay is built from the clean copy, not from the image carrying the crossmarks
+    return visualize_mask(input_image, mask), img
+def run_inpaint(prompt, negative_prompt, cfg, seed, invert):
+    """
+    Runs the inpainting process based on user inputs.
+    Uses the module-level input_image and input_points captured by get_points.
+    Args:
+        prompt (str): Prompt for infill.
+        negative_prompt (str): Negative prompt.
+        cfg (float): Classifier-Free Guidance Scale.
+        seed (int): Random seed.
+        invert (bool): Whether to infill the subject instead of the background.
+    Returns:
+        PIL.Image: The inpainted image, resized to IMG_SIZE x IMG_SIZE.
+    Raises:
+        gr.Error: If no image or points have been captured yet, or if replace_object fails.
+    """
+    # The globals are only read here, so no `global` declaration is required
+    if input_image is None or not input_points:
+        raise gr.Error("No points provided. Click on the image to select the object to segment with SAM.")
+    mask = generate_mask(input_image, input_points)
+    if invert:
+        # NOTE(review): `~` is a logical inversion only for boolean masks - confirm generate_mask's dtype
+        mask = ~mask
+    try:
+        inpainted = replace_object(input_image, mask, prompt, negative_prompt, seed, cfg)
+    except Exception as e:
+        # Show the failure in the UI while keeping the original traceback chained for the logs
+        raise gr.Error(str(e)) from e
+    return inpainted.resize((IMG_SIZE, IMG_SIZE))
+def reset_points_func():
+    """
+    Clears the stored click points and forgets the stored original image.
+    Returns:
+        Tuple: (None, None, None) - empties the mask visualization, the marked image and the inpainted image.
+    """
+    global input_points, input_image
+    input_points, input_image = [], None
+    # One None per output component bound to this callback
+    return (None,) * 3
+def preprocess(input_img):
+    """
+    Pads the uploaded image to a square with white borders, then scales it to IMG_SIZE x IMG_SIZE.
+    Args:
+        input_img (PIL.Image): The uploaded image, or None when nothing is loaded.
+    Returns:
+        PIL.Image: The square, resized image, or None if no image was given.
+    """
+    if input_img is None:
+        return None
+    w, h = input_img.size
+    if w != h:
+        # Center the picture on a white square whose side equals the longer edge
+        side = max(w, h)
+        canvas = Image.new("RGB", (side, side), 'white')
+        canvas.paste(input_img, ((side - w) // 2, (side - h) // 2))
+        input_img = canvas
+    return input_img.resize((IMG_SIZE, IMG_SIZE))
+def build_app(get_processed_inputs, inpaint):
+    """
+    Builds and launches the Gradio app.
+    The event handlers are wired to the module-level get_points, preprocess,
+    run_inpaint and reset_points_func functions.
+    Args:
+        get_processed_inputs (function): Currently unused; kept so existing callers keep working.
+        inpaint (function): Currently unused; kept so existing callers keep working.
+    Returns:
+        None
+    """
+    with gr.Blocks() as demo:
+        gr.Markdown(
         """
+        # Object Replacement App
+        Upload an image, select points on the object you want to replace, provide a text prompt for the replacement, and view the augmented image.
         **Instructions:**
+        1. **Upload Image:** Click on the first image box to upload your image.
+        2. **Select Points:** Click on the image to select points on the object you wish to replace. Use multiple points for better mask accuracy.
         3. **Enter Prompts:** Provide a replacement prompt and optionally a negative prompt to refine the output.
         4. **Adjust Settings:** Set the seed for reproducibility and adjust the guidance scale as needed.
         5. **Replace Object:** Click the "Replace Object" button to generate the augmented image.
+        6. **Reset:** Click the "Reset" button to clear selections and start over.
+        """)
+        with gr.Row():
+            with gr.Column():
+                # Image upload and point selection
+                upload_image = gr.Image(label="Upload Image", type="pil", interactive=True)
+                mask_visualization = gr.Image(label="Selected Object Mask Overlay", interactive=False)
+                selected_image = gr.Image(label="Image with Selected Points", type="pil", interactive=False)
+                # Capture points using the select event
+                upload_image.select(get_points, inputs=[upload_image], outputs=[mask_visualization, selected_image])
+                # Preprocess image on change (the result is written back into the same component)
+                upload_image.change(preprocess, inputs=[upload_image], outputs=[upload_image])
+                # Text inputs and settings
+                prompt = gr.Textbox(label="Replacement Prompt", placeholder="e.g., a red sports car", lines=2)
+                negative_prompt = gr.Textbox(label="Negative Prompt", placeholder="e.g., blurry, low quality", lines=2)
+                cfg = gr.Slider(
+                    label="Classifier-Free Guidance Scale",
+                    minimum=1.0,
+                    maximum=20.0,
+                    value=7.5,
+                    step=0.5
+                )
+                seed = gr.Number(label="Seed", value=42, precision=0)
+                invert = gr.Checkbox(label="Infill subject instead of background")
+                # Buttons
+                replace_button = gr.Button("Replace Object")
+                reset_button = gr.Button("Reset")
+            with gr.Column():
+                # Output images
+                augmented_image = gr.Image(label="Augmented Image", type="pil", interactive=False)
+        # Define button actions
+        replace_button.click(
+            fn=run_inpaint,
+            inputs=[prompt, negative_prompt, cfg, seed, invert],
+            outputs=[augmented_image]
+        )
+        reset_button.click(
+            fn=reset_points_func,
+            inputs=[],
+            outputs=[mask_visualization, selected_image, augmented_image]
+        )
+        # Examples (optional)
+        gr.Markdown(
+            """
+            ## EXAMPLES
+            Click on an example to load it. Then, follow the instructions above.
+            """)
+        with gr.Row():
+            # NOTE(review): the example image files are referenced by relative path - confirm they ship with the app
+            gr.Examples(
+                examples=[
+                    ["car.png", "a red sports car", "blurry, low quality", 42],
+                    ["house.jpg", "a modern villa", "dark, overexposed", 123],
+                    ["tree.png", "a blooming cherry tree", "underexposed, low contrast", 999]
+                ],
+                inputs=[
+                    upload_image,
+                    prompt,
+                    negative_prompt,
+                    seed
+                ],
+                label="Click to load examples",
+                # Caching needs `fn` and `outputs`; these examples only fill the inputs, so caching stays off
+                cache_examples=False
+            )
+    demo.queue(max_size=10).launch()
+# Launch the app: build_app does not use either argument, so None is passed for both
+build_app(None, None)