Wan2.1

Running

File size: 6,949 Bytes

4e424ea
ca753f0
4e424ea
3893fde
632fdb4
7bedcdd
4e424ea
 
 
 
 
 
 
 
ca753f0
73566e5
9220522
 
 
 
935512c
9220522
4d169d8
 
 
 
9220522
935512c
665534e
935512c
9220522
 
632fdb4
9220522
 
 
 
665534e
4e424ea
9d714b0
4e424ea
 
 
 
 
f0f4c78
4e424ea
 
 
632fdb4
 
 
 
 
 
 
9220522
9d714b0
632fdb4
 
 
 
 
 
 
 
9220522
632fdb4
 
9220522
632fdb4
9d714b0
 
632fdb4
 
 
 
9d714b0
9220522
665534e
 
 
 
 
632fdb4
 
9220522
632fdb4
 
 
 
 
 
 
9220522
632fdb4
 
 
9220522
632fdb4
9220522
632fdb4
 
9220522
 
 
 
 
 
 
632fdb4
9220522
 
 
632fdb4
9d714b0
 
632fdb4
 
 
 
9d714b0
9220522
9d714b0
632fdb4
9d714b0
632fdb4
935512c
632fdb4
ca753f0
9220522
 
632fdb4
 
9d714b0
632fdb4
9d714b0
9220522
632fdb4
 
 
 
9d714b0
632fdb4
 
 
 
9220522
632fdb4
 
f0f4c78
632fdb4
665534e
632fdb4
 
935512c
2562fab
f0f4c78
4e424ea
d701afa
4e424ea
 
f0f4c78
4e424ea
 
 
 
c81f025
4e424ea

import gradio as gr
import re 
import subprocess
import time
import select
from tqdm import tqdm
from huggingface_hub import snapshot_download

# Fetch the Wan2.1 T2V 1.3B checkpoint from the Hugging Face Hub into the
# local directory that infer() later passes to the generator as --ckpt_dir.
snapshot_download(
    repo_id="Wan-AI/Wan2.1-T2V-1.3B",
    local_dir="./Wan2.1-T2V-1.3B",
)

def infer(prompt, progress=gr.Progress(track_tqdm=True)):
    """Generate a video for ``prompt`` and return the path of the saved file.

    Runs ``python -u -m generate`` as a subprocess and turns its merged
    stdout/stderr into three tqdm bars:

    * "Overall Process" (position 1): one step per finished sub-step or
      finished video-generation bar.
    * "Video Generation" (position 0): mirrors the ``current/total`` counters
      parsed from the subprocess's own progress lines.
    * A sub-step bar (position 2): labelled with the latest ``INFO:`` message
      and advanced by one tick for every 40 ms in which no output arrives;
      it is force-completed after 500 ticks or when the next step starts.

    Args:
        prompt: Text prompt forwarded to the generator via ``--prompt``.
        progress: Gradio progress tracker. It is not referenced in the body;
            it is declared with ``track_tqdm=True`` so that Gradio can mirror
            the tqdm bars created here.

    Returns:
        The string ``"generated_video.mp4"`` (the ``--save_file`` argument)
        when the subprocess exits with status 0.

    Raises:
        RuntimeError: If the subprocess exits with a non-zero status.
    """
    # Function-scope imports: only this function needs them.
    import queue
    import threading

    # Configuration
    total_process_steps = 11          # Total INFO messages expected
    irrelevant_steps = 4              # First 4 INFO messages are ignored
    relevant_steps = total_process_steps - irrelevant_steps  # 7 overall (relevant) steps
    sub_tick_total = 500              # 500 ticks * 40 ms = 20 seconds per sub-step
    tick_seconds = 0.04               # How long to wait for output before ticking

    # Regex for video generation progress lines, e.g. " 42%|####  | 21/50 ...".
    progress_pattern = re.compile(r"(\d+)%\|.*\| (\d+)/(\d+)")

    command = [
        "python", "-u", "-m", "generate",  # using -u for unbuffered output
        "--task", "t2v-1.3B",
        "--size", "832*480",
        "--ckpt_dir", "./Wan2.1-T2V-1.3B",
        "--sample_shift", "8",
        "--sample_guide_scale", "6",
        "--prompt", prompt,
        "--save_file", "generated_video.mp4"
    ]

    # Overall process progress bar (Level 1)
    overall_bar = tqdm(total=relevant_steps, desc="Overall Process", position=1,
                       ncols=120, dynamic_ncols=False, leave=True)
    video_progress_bar = None   # Level 3, created on the first progress line
    sub_bar = None              # Level 2, one per sub-step
    sub_ticks = 0
    processed_steps = 0         # Number of leading INFO messages skipped so far

    def start_sub_bar(description):
        """Create a fresh sub-step bar labelled with ``description``."""
        return tqdm(total=sub_tick_total, desc=description, position=2,
                    ncols=120, dynamic_ncols=False, leave=True)

    def finish_sub_bar():
        """Fill and close the active sub-step bar and advance the overall bar."""
        nonlocal sub_bar, sub_ticks
        if sub_ticks < sub_tick_total:
            sub_bar.update(sub_tick_total - sub_ticks)
        sub_bar.close()
        overall_bar.update(1)
        overall_bar.refresh()
        sub_bar = None
        sub_ticks = 0

    # The pipe is read on a helper thread and handed over through a queue.
    # Polling the raw file descriptor with select() while reading through the
    # buffered text wrapper can report "no data" although complete lines are
    # already sitting in Python's buffer, which delays them and mis-times the
    # sub-step ticks.
    output_lines = queue.Queue()
    end_of_output = object()

    def pump_output(stream):
        """Forward every line of ``stream`` to the queue, then signal EOF."""
        try:
            for raw_line in stream:
                output_lines.put(raw_line)
        finally:
            output_lines.put(end_of_output)

    process = None
    reader = None
    try:
        process = subprocess.Popen(command,
                                   stdout=subprocess.PIPE,
                                   stderr=subprocess.STDOUT,
                                   text=True,
                                   errors="replace",  # never fail on undecodable bytes
                                   bufsize=1)
        reader = threading.Thread(target=pump_output, args=(process.stdout,),
                                  daemon=True)
        reader.start()

        while True:
            try:
                line = output_lines.get(timeout=tick_seconds)
            except queue.Empty:
                # No new line within 40ms: advance the active sub-bar, if any.
                if sub_bar is not None:
                    sub_bar.update(1)
                    sub_ticks += 1
                    sub_bar.refresh()
                    if sub_ticks >= sub_tick_total:
                        # 20 seconds have elapsed; finish this sub-step.
                        finish_sub_bar()
                continue

            if line is end_of_output:
                break
            stripped_line = line.strip()
            if not stripped_line:
                continue

            # Video generation progress (Level 3). These lines are not echoed.
            progress_match = progress_pattern.search(stripped_line)
            if progress_match:
                # Entering the video phase ends any active sub-step bar.
                if sub_bar is not None:
                    finish_sub_bar()
                current = int(progress_match.group(2))
                total = int(progress_match.group(3))
                if video_progress_bar is None:
                    video_progress_bar = tqdm(total=total, desc="Video Generation", position=0,
                                              ncols=120, dynamic_ncols=True, leave=True)
                # Move the bar to the absolute position reported by the child.
                video_progress_bar.update(current - video_progress_bar.n)
                video_progress_bar.refresh()
                # When video generation completes, update overall bar.
                if video_progress_bar.n >= video_progress_bar.total:
                    overall_bar.update(1)
                    overall_bar.refresh()
                    video_progress_bar.close()
                    video_progress_bar = None
                continue

            print(stripped_line)
            if "INFO:" not in stripped_line:
                continue

            # INFO messages drive the sub-step bars.
            msg = stripped_line.partition("INFO:")[2].strip()
            if processed_steps < irrelevant_steps:
                # The first INFO messages are only counted; show a waiting bar
                # until the first relevant step arrives.
                processed_steps += 1
                if sub_bar is None:
                    sub_bar = start_sub_bar("Waiting for first step...")
                    sub_ticks = 0
                continue

            # Relevant phase: close the previous sub-step (or the waiting bar)
            # and start a new one labelled with the current INFO message.
            if sub_bar is not None:
                finish_sub_bar()
            sub_bar = start_sub_bar(msg)
            sub_ticks = 0

        process.wait()
    finally:
        if process is not None:
            if process.poll() is None:
                # Only reached when an exception interrupted the loop: do not
                # leave the generator running in the background.
                process.kill()
                process.wait()
            if reader is not None:
                reader.join(timeout=5)
            # Close the pipe only once the reader thread is done with it.
            if process.stdout is not None and (reader is None or not reader.is_alive()):
                process.stdout.close()
        if video_progress_bar is not None:
            video_progress_bar.close()
        if sub_bar is not None:
            sub_bar.close()
        overall_bar.close()

    if process.returncode == 0:
        print("Command executed successfully.")
        return "generated_video.mp4"

    print("Error executing command.")
    raise RuntimeError("Error executing command")

# Build the UI: a single column with a title, a prompt box, a submit button
# and a video player for the result.
with gr.Blocks() as demo:
    with gr.Column():
        gr.Markdown("# Wan 2.1")
        prompt = gr.Textbox(label="Prompt")
        submit_btn = gr.Button("Submit")
        video_res = gr.Video(label="Generated Video")

    # Clicking the button runs infer() on the prompt text and shows the
    # returned file in the video component.
    submit_btn.click(fn=infer, inputs=[prompt], outputs=[video_res])

# Enable the request queue, then start the server.
app = demo.queue()
app.launch(show_error=True, show_api=False, ssr_mode=False)