Sergidev committed on
Commit
7b7a9c0
·
1 Parent(s): d83ac8a
Files changed (1) hide show
  1. demo_app.py +50 -18
demo_app.py CHANGED
@@ -47,8 +47,8 @@ pipe.vae = pipe.vae.to("cuda")
47
  pipe = pipe.to("cuda")
48
 
49
  pipe.load_lora_weights(
50
- "calcuis/hyvid",
51
- weight_name="hyvid-lora-mila3d.safetensors",
52
  adapter_name="hyvid_lora_adapter"
53
  )
54
  pipe.set_adapters("hyvid_lora_adapter", 1.2)
@@ -59,7 +59,7 @@ torch.cuda.empty_cache()
59
  MAX_SEED = np.iinfo(np.int32).max
60
  MAX_IMAGE_SIZE = 1024
61
 
62
- @spaces.GPU(duration=120) # Adjusted duration to 120
63
  def generate(
64
  prompt,
65
  height,
@@ -86,13 +86,18 @@ def generate(
86
  ).frames[0]
87
 
88
  output_path = "output.mp4"
89
- export_to_video(output, output_path, fps=fps) # Use user-defined fps
90
  torch.cuda.empty_cache()
91
  gc.collect()
92
  return output_path
93
 
 
 
 
 
 
 
94
 
95
- # Gradio Interface
96
  css = """
97
  #col-container {
98
  margin: 0 auto;
@@ -131,6 +136,18 @@ css = """
131
  padding: 15px;
132
  border-radius: 8px;
133
  margin-bottom: 1em;
 
 
 
 
 
 
 
 
 
 
 
 
134
  }
135
 
136
  .support-text {
@@ -157,17 +174,25 @@ with gr.Blocks(css=css, theme="dark") as demo:
157
  """Transform your text descriptions into anime-style videos using state-of-the-art AI technology.
158
  This space uses the HunyuanVideo model to generate high-quality animated sequences.
159
 
160
- If you find this useful, please consider ❤️ hearting the space and supporting me on [Ko-Fi](https://ko-fi.com/sergidev)!""",
161
  elem_classes=["description"]
162
  )
163
 
164
- with gr.Row(elem_classes=["prompt-container"]):
165
- prompt = gr.Text(
166
  label="Prompt",
167
  placeholder="Enter your prompt here (e.g., 'a cute anime girl walking in a garden')",
168
  show_label=False,
 
 
169
  )
170
- run_button = gr.Button("🎨 Generate", variant="primary")
 
 
 
 
 
 
171
 
172
  with gr.Row():
173
  result = gr.Video(label="Generated Video")
@@ -181,19 +206,19 @@ with gr.Blocks(css=css, theme="dark") as demo:
181
  value=-1,
182
  )
183
  with gr.Row():
184
- height = gr.Slider( # Fixed order of height and width to match intended use
185
  label="Height",
186
  minimum=256,
187
  maximum=MAX_IMAGE_SIZE,
188
- step=16, # Make divisible by 16
189
- value=512,
190
  )
191
  width = gr.Slider(
192
  label="Width",
193
  minimum=256,
194
  maximum=MAX_IMAGE_SIZE,
195
  step=16,
196
- value=320,
197
  )
198
  with gr.Row():
199
  num_frames = gr.Slider(
@@ -201,30 +226,37 @@ with gr.Blocks(css=css, theme="dark") as demo:
201
  minimum=1.0,
202
  maximum=257.0,
203
  step=1,
204
- value=42,
205
  )
206
  num_inference_steps = gr.Slider(
207
  label="Number of inference steps",
208
  minimum=1,
209
  maximum=50,
210
  step=1,
211
- value=30,
212
  )
213
  fps = gr.Slider(
214
  label="Frames per second",
215
  minimum=1,
216
  maximum=60,
217
  step=1,
218
- value=14,
219
  )
220
 
221
  # Event handling
222
  run_button.click(
223
  fn=generate,
224
  inputs=[prompt, height, width, num_frames, num_inference_steps, seed, fps],
225
- # Added fps to inputs, fixed height/width order
226
  outputs=[result],
227
  )
228
 
 
 
 
 
 
229
 
230
- # The demo.queue and demo.launch are handled in app.py
 
 
 
 
47
  pipe = pipe.to("cuda")
48
 
49
  pipe.load_lora_weights(
50
+ "sergidev/IllustrationTTV",
51
+ weight_name="hunyuan_flat_color_v2.safetensors",
52
  adapter_name="hyvid_lora_adapter"
53
  )
54
  pipe.set_adapters("hyvid_lora_adapter", 1.2)
 
59
  MAX_SEED = np.iinfo(np.int32).max
60
  MAX_IMAGE_SIZE = 1024
61
 
62
+ @spaces.GPU(duration=120)
63
  def generate(
64
  prompt,
65
  height,
 
86
  ).frames[0]
87
 
88
  output_path = "output.mp4"
89
+ export_to_video(output, output_path, fps=fps)
90
  torch.cuda.empty_cache()
91
  gc.collect()
92
  return output_path
93
 
94
def apply_preset(preset_name, *current_values):
    """Return slider values [height, width, num_frames, steps, fps] for a named preset.

    Args:
        preset_name: One of "Higher Resolution" or "More Frames"; any other
            value leaves the current slider values unchanged.
        *current_values: The current slider values, passed through unchanged
            when the preset name is not recognized.

    Returns:
        A list of five values in the order expected by the Gradio outputs:
        [height, width, num_frames, num_inference_steps, fps].
    """
    if preset_name == "Higher Resolution":
        # Larger frame size traded against fewer frames / lower fps.
        return [608, 448, 24, 29, 12]
    elif preset_name == "More Frames":
        # Longer clip at a smaller resolution.
        return [512, 320, 42, 30, 14]
    # Fix: return a list (not the *args tuple) so the return type is
    # consistent across all paths.
    return list(current_values)
100
 
 
101
  css = """
102
  #col-container {
103
  margin: 0 auto;
 
136
  padding: 15px;
137
  border-radius: 8px;
138
  margin-bottom: 1em;
139
+ width: 100%;
140
+ }
141
+
142
+ .prompt-textbox {
143
+ min-height: 80px !important;
144
+ }
145
+
146
+ .preset-buttons {
147
+ display: flex;
148
+ gap: 10px;
149
+ justify-content: center;
150
+ margin-bottom: 1em;
151
  }
152
 
153
  .support-text {
 
174
  """Transform your text descriptions into anime-style videos using state-of-the-art AI technology.
175
  This space uses the HunyuanVideo model to generate high-quality animated sequences.
176
 
177
+ If you find this useful, please consider giving the space a ❤️ and supporting me on [Ko-Fi](https://ko-fi.com/sergidev)!""",
178
  elem_classes=["description"]
179
  )
180
 
181
+ with gr.Column(elem_classes=["prompt-container"]):
182
+ prompt = gr.Textbox(
183
  label="Prompt",
184
  placeholder="Enter your prompt here (e.g., 'a cute anime girl walking in a garden')",
185
  show_label=False,
186
+ elem_classes=["prompt-textbox"],
187
+ lines=3
188
  )
189
+
190
+ with gr.Row():
191
+ run_button = gr.Button("🎨 Generate", variant="primary", size="lg")
192
+
193
+ with gr.Row(elem_classes=["preset-buttons"]):
194
+ preset_high_res = gr.Button("📺 Higher Resolution Preset")
195
+ preset_more_frames = gr.Button("🎞️ More Frames Preset")
196
 
197
  with gr.Row():
198
  result = gr.Video(label="Generated Video")
 
206
  value=-1,
207
  )
208
  with gr.Row():
209
+ height = gr.Slider(
210
  label="Height",
211
  minimum=256,
212
  maximum=MAX_IMAGE_SIZE,
213
+ step=16,
214
+ value=608,
215
  )
216
  width = gr.Slider(
217
  label="Width",
218
  minimum=256,
219
  maximum=MAX_IMAGE_SIZE,
220
  step=16,
221
+ value=448,
222
  )
223
  with gr.Row():
224
  num_frames = gr.Slider(
 
226
  minimum=1.0,
227
  maximum=257.0,
228
  step=1,
229
+ value=24,
230
  )
231
  num_inference_steps = gr.Slider(
232
  label="Number of inference steps",
233
  minimum=1,
234
  maximum=50,
235
  step=1,
236
+ value=29,
237
  )
238
  fps = gr.Slider(
239
  label="Frames per second",
240
  minimum=1,
241
  maximum=60,
242
  step=1,
243
+ value=12,
244
  )
245
 
246
  # Event handling
247
  run_button.click(
248
  fn=generate,
249
  inputs=[prompt, height, width, num_frames, num_inference_steps, seed, fps],
 
250
  outputs=[result],
251
  )
252
 
253
+ # Preset button handlers
254
+ preset_high_res.click(
255
+ fn=lambda: apply_preset("Higher Resolution"),
256
+ outputs=[height, width, num_frames, num_inference_steps, fps]
257
+ )
258
 
259
+ preset_more_frames.click(
260
+ fn=lambda: apply_preset("More Frames"),
261
+ outputs=[height, width, num_frames, num_inference_steps, fps]
262
+ )