import gradio as gr
import torch
import numpy as np
from diffusers import DiffusionPipeline
from diffusers.pipelines.stable_diffusion import StableDiffusionSafetyChecker
from functools import lru_cache
from PIL import Image
from transformers import CLIPImageProcessor  # replaces the deprecated CLIPFeatureExtractor

# lru_cache ensures the heavyweight models are loaded only once per process
@lru_cache(maxsize=1)
def load_pipeline():
    # Load the FLUX.1-dev base model in bfloat16 to halve memory use
    base_model = "black-forest-labs/FLUX.1-dev"
    pipe = DiffusionPipeline.from_pretrained(
        base_model,
        torch_dtype=torch.bfloat16
    )

    # Load the super-realism LoRA weights on top of the base model
    lora_repo = "strangerzonehf/Flux-Super-Realism-LoRA"
    pipe.load_lora_weights(lora_repo)

    # Load the safety checker and its CLIP image processor
    safety_checker = StableDiffusionSafetyChecker.from_pretrained(
        "CompVis/stable-diffusion-safety-checker"
    )
    image_processor = CLIPImageProcessor.from_pretrained("openai/clip-vit-base-patch32")

    # Optimization: enable memory-efficient attention on GPU. Not every
    # pipeline/attention-processor combination supports xformers, so fall
    # back silently to the default PyTorch SDPA attention if it fails.
    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
    if device.type == "cuda":
        try:
            pipe.enable_xformers_memory_efficient_attention()
        except Exception:
            pass
    pipe = pipe.to(device)

    return pipe, safety_checker, image_processor

pipe, safety_checker, image_processor = load_pipeline()
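
# Hedged example (not part of the original Space): a minimal smoke test that
# calls the pipeline directly, bypassing Gradio, to verify the base model,
# LoRA, and device placement work before launching the UI. The prompt, size,
# and step count are illustrative assumptions; a 4-step run only checks
# wiring, not image quality. Define it here; call it manually if needed.
def _smoke_test(prompt="Super Realism, a portrait of a person"):
    generator = torch.Generator(device=pipe.device).manual_seed(0)
    with torch.inference_mode():
        return pipe(
            prompt=prompt,
            width=512,
            height=512,
            guidance_scale=6,
            num_inference_steps=4,
            generator=generator,
        ).images[0]
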
def generate_image(
    prompt,
    seed=42,
    width=1024,
    height=1024,
    guidance_scale=6,
    steps=28,
    progress=gr.Progress()
):
    try:
        progress(0, desc="Initializing...")
        device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
        # Gradio sliders deliver floats; the generator and scheduler need ints
        seed, width, height, steps = int(seed), int(width), int(height), int(steps)
        generator = torch.Generator(device=device).manual_seed(seed)

        # Auto-prepend the LoRA trigger words if the prompt lacks them
        if "super realism" not in prompt.lower():
            prompt = f"Super Realism, {prompt}"

        # Step-end progress callback. diffusers replaced the legacy `callback`
        # kwarg with `callback_on_step_end`, which receives the pipeline and
        # must return the (possibly modified) callback_kwargs dict.
        def update_progress(pipeline, step, timestep, callback_kwargs):
            progress((step + 1) / steps, desc="Generating image...")
            return callback_kwargs

        with torch.inference_mode():
            result = pipe(
                prompt=prompt,
                width=width,
                height=height,
                guidance_scale=guidance_scale,
                num_inference_steps=steps,
                generator=generator,
                callback_on_step_end=update_progress
            )
            image = result.images[0]

        progress(1, desc="Safety checking...")
        # Preprocess the image for the safety checker's CLIP encoder
        safety_input = image_processor(image, return_tensors="pt")
        np_image = np.array(image)

        # The safety checker returns (images, has_nsfw_concepts)
        _, nsfw_detected = safety_checker(
            images=[np_image],
            clip_input=safety_input.pixel_values
        )

        if nsfw_detected[0]:
            return Image.new("RGB", (512, 512)), "NSFW content detected"

        return image, "Generation successful"
    except Exception as e:
        return Image.new("RGB", (512, 512)), f"Error: {str(e)}"
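
# Illustrative direct usage (an assumption, not part of the original file):
# generate_image returns a (PIL.Image, status-string) pair, the same contract
# the Gradio outputs below depend on. For example:
#
#     image, status = generate_image("a portrait of an elderly fisherman", seed=7)
#     if status == "Generation successful":
#         image.save("out.png")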

with gr.Blocks() as app:
    gr.Markdown("# Flux Super Realism Generator")
    with gr.Row():
        with gr.Column():
            prompt_input = gr.Textbox(label="Prompt", value="A portrait of a person")
            seed_input = gr.Slider(0, 1000, value=42, step=1, label="Seed")
            # FLUX expects dimensions divisible by 16; step=16 keeps inputs valid
            width_input = gr.Slider(512, 2048, value=1024, step=16, label="Width")
            height_input = gr.Slider(512, 2048, value=1024, step=16, label="Height")
            guidance_input = gr.Slider(1, 20, value=6, label="Guidance Scale")
            steps_input = gr.Slider(10, 100, value=28, step=1, label="Steps")
            submit = gr.Button("Generate")
        with gr.Column():
            output_image = gr.Image(label="Result", type="pil")
            status = gr.Textbox(label="Status")

    submit.click(
        generate_image,
        inputs=[prompt_input, seed_input, width_input, height_input, guidance_input, steps_input],
        outputs=[output_image, status]
    )

# Queue requests: at most 3 jobs waiting; Gradio processes events one at a
# time per worker by default, which acts as simple rate limiting.
app.queue(max_size=3).launch()

# Optional low-VRAM alternatives (apply inside load_pipeline() *instead of*
# pipe.to(device) — these offload weights to the CPU to save memory; they do
# not add multi-GPU support):
# pipe.enable_model_cpu_offload()
# pipe.enable_sequential_cpu_offload()
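
# Note (an assumption, based on this Space running on ZeroGPU): ZeroGPU
# hardware allocates a GPU only while a decorated function runs, so the
# generation entry point would typically be wrapped as:
#
#     import spaces
#
#     @spaces.GPU
#     def generate_image(...):
#         ...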