Spaces:

vvaibhav
/

inpainting_background_swapper

Running

App Files Files Community

vvaibhav commited on Jan 15

Commit

18c979d

verified ·

1 Parent(s): 13cac7d

Create app.py

Browse files

Files changed (1) hide show

app.py +190 -0

app.py ADDED Viewed

	@@ -0,0 +1,190 @@

+# app.py
+import gradio as gr
+from PIL import Image
+import torch
+import numpy as np
+from transformers import SamModel, SamProcessor
+from diffusers import StableDiffusionInpaintPipeline
+import io
+# Initialize SAM model and processor
+sam_model = SamModel.from_pretrained("facebook/sam-vit-huge").to("cuda")
+sam_processor = SamProcessor.from_pretrained("facebook/sam-vit-huge")
+# Initialize Inpainting pipeline
+inpaint_pipeline = StableDiffusionInpaintPipeline.from_pretrained(
+    "runwayml/stable-diffusion-inpainting",
+    torch_dtype=torch.float16
+).to("cuda")
+inpaint_pipeline.enable_model_cpu_offload()
+def mask_to_rgba(mask):
+    """
+    Converts a binary mask to an RGBA image for visualization.
+    """
+    bg_transparent = np.zeros(mask.shape + (4,), dtype=np.uint8)
+    bg_transparent[mask == 1] = [0, 255, 0, 127]  # Green with transparency
+    return bg_transparent
+def generate_mask(image, input_points):
+    """
+    Generates a binary mask using SAM based on input points.
+    Args:
+        image (PIL.Image): The input image.
+        input_points (list of lists): List of points selected by the user.
+    Returns:
+        np.ndarray: Binary mask where the object is marked with 1s.
+    """
+    if not input_points:
+        return None
+    # Convert image to RGB if not already
+    image = image.convert("RGB")
+    # Flatten the list of points
+    points = [tuple(point) for point in input_points]
+    # Prepare inputs for SAM
+    inputs = sam_processor(image, points=points, return_tensors="pt").to("cuda")
+    with torch.no_grad():
+        outputs = sam_model(**inputs)
+    # Post-process masks
+    masks = sam_processor.image_processor.post_process_masks(
+        outputs.pred_masks.cpu(),
+        inputs["original_sizes"].cpu(),
+        inputs["reshaped_input_sizes"].cpu()
+    )
+    if len(masks) == 0:
+        return None
+    # Select the mask with the highest IoU score
+    best_mask = masks[0][0][outputs.iou_scores.argmax()]
+    # Invert mask: object=1, background=0
+    binary_mask = ~best_mask.numpy().astype(bool).astype(int)
+    return binary_mask
+def replace_object(image, mask, prompt, negative_prompt, seed, guidance_scale):
+    """
+    Replaces the selected object in the image based on the prompt.
+    Args:
+        image (PIL.Image): The original image.
+        mask (np.ndarray): Binary mask of the selected object.
+        prompt (str): Text prompt describing the replacement.
+        negative_prompt (str): Negative text prompt to refine generation.
+        seed (int): Random seed for reproducibility.
+        guidance_scale (float): Guidance scale for the inpainting model.
+    Returns:
+        PIL.Image: The augmented image with the object replaced.
+    """
+    if mask is None:
+        return image
+    mask_image = Image.fromarray((mask * 255).astype(np.uint8))
+    generator = torch.Generator("cuda").manual_seed(seed)
+    try:
+        result = inpaint_pipeline(
+            prompt=prompt,
+            image=image,
+            mask_image=mask_image,
+            negative_prompt=negative_prompt if negative_prompt else None,
+            generator=generator,
+            guidance_scale=guidance_scale
+        ).images[0]
+        return result
+    except Exception as e:
+        print(f"Inpainting error: {e}")
+        return image
+def visualize_mask(image, mask):
+    """
+    Overlays the mask on the image for visualization.
+    Args:
+        image (PIL.Image): The original image.
+        mask (np.ndarray): Binary mask of the selected object.
+    Returns:
+        PIL.Image: Image with mask overlay.
+    """
+    if mask is None:
+        return image
+    mask_rgba = mask_to_rgba(mask)
+    mask_pil = Image.fromarray(mask_rgba)
+    overlay = Image.alpha_composite(image.convert("RGBA"), mask_pil)
+    return overlay.convert("RGB")
+def process(image, points, prompt, negative_prompt, seed, guidance_scale):
+    """
+    Processes the image by replacing the selected object based on the prompt.
+    Args:
+        image (PIL.Image): Uploaded image.
+        points (list of lists): Points selected on the image.
+        prompt (str): Text prompt for replacement.
+        negative_prompt (str): Negative text prompt.
+        seed (int): Seed for reproducibility.
+        guidance_scale (float): Guidance scale.
+    Returns:
+        Tuple of images: Original with mask overlay and augmented image.
+    """
+    mask = generate_mask(image, points)
+    masked_image = visualize_mask(image, mask)
+    augmented_image = replace_object(image, mask, prompt, negative_prompt, seed, guidance_scale)
+    return masked_image, augmented_image
+# Define Gradio Interface
+with gr.Blocks() as demo:
+    gr.Markdown("# Object Replacement App")
+    gr.Markdown(
+        """
+        Upload an image, select points on the object you want to replace, provide a text prompt for the replacement, and view the augmented image.
+        """
+    )
+    with gr.Row():
+        with gr.Column():
+            image_input = gr.Image(label="Upload Image", type="pil")
+            prompt_input = gr.Textbox(label="Replacement Prompt", placeholder="e.g., a red sports car", lines=2)
+            negative_prompt_input = gr.Textbox(label="Negative Prompt", placeholder="e.g., blurry, low quality", lines=2)
+            seed_input = gr.Number(label="Seed", value=42)
+            guidance_scale_input = gr.Slider(label="Guidance Scale", minimum=1, maximum=20, value=7.5)
+            process_button = gr.Button("Replace Object")
+        with gr.Column():
+            masked_output = gr.Image(label="Selected Object Mask Overlay")
+            augmented_output = gr.Image(label="Augmented Image")
+    image_input.change(fn=lambda img: img, inputs=image_input, outputs=masked_output)
+    process_button.click(
+        fn=process,
+        inputs=[image_input, gr.State(), prompt_input, negative_prompt_input, seed_input, guidance_scale_input],
+        outputs=[masked_output, augmented_output]
+    )
+    gr.Markdown(
+        """
+        **Instructions:**
+        1. **Upload Image:** Upload the image containing the object you want to replace.
+        2. **Select Points:** Click on the image to select points on the object. Use multiple points for better mask accuracy.
+        3. **Enter Prompts:** Provide a replacement prompt and optionally a negative prompt to refine the output.
+        4. **Adjust Settings:** Set the seed for reproducibility and adjust the guidance scale as needed.
+        5. **Replace Object:** Click the "Replace Object" button to generate the augmented image.
+        """
+    )
+# Launch the app
+demo.launch()