ozilion committed
Commit c40d82c · verified · 1 Parent(s): 05424ef

Update app.py

Files changed (1)
  1. app.py +342 -253
app.py CHANGED
@@ -7,7 +7,7 @@ import tempfile
  from typing import Optional, Tuple
  import time
 
- # ZeroGPU support (even without detection)
  try:
  import spaces
  SPACES_AVAILABLE = True
@@ -15,7 +15,7 @@ except ImportError:
  SPACES_AVAILABLE = False
  class spaces:
  @staticmethod
- def GPU(duration=240):
  def decorator(func): return func
  return decorator
 
@@ -24,69 +24,42 @@ IS_ZERO_GPU = os.environ.get("SPACES_ZERO_GPU") == "true"
  IS_SPACES = os.environ.get("SPACE_ID") is not None
  HAS_CUDA = torch.cuda.is_available()
 
- print(f"🚀 H200 MIG Environment: ZeroGPU={IS_ZERO_GPU}, Spaces={IS_SPACES}, CUDA={HAS_CUDA}")
 
- # Working models based on your diagnostic
- WORKING_MODELS = [
  {
- "id": "Lightricks/LTX-Video",
- "name": "LTX-Video",
- "pipeline_class": "DiffusionPipeline",
- "variant": None, # No fp16 variant available
- "use_safetensors": False, # Use .bin files
- "resolution": (512, 512),
- "max_frames": 50,
  "dtype": torch.bfloat16,
  "priority": 1,
- "description": "LTX-Video via DiffusionPipeline (no variant)"
  },
  {
- "id": "THUDM/CogVideoX-5b",
- "name": "CogVideoX-5B",
- "pipeline_class": "CogVideoXPipeline",
- "variant": None,
- "use_safetensors": True,
- "resolution": (720, 480),
  "max_frames": 49,
  "dtype": torch.bfloat16,
  "priority": 2,
- "description": "CogVideo 5B model - proven to work"
  },
  {
- "id": "cerspense/zeroscope_v2_576w",
- "name": "Zeroscope V2",
  "pipeline_class": "DiffusionPipeline",
- "variant": None, # No fp16 variant
- "use_safetensors": False, # Use .bin files
- "resolution": (576, 320),
- "max_frames": 24,
- "dtype": torch.float16,
  "priority": 3,
- "description": "Zeroscope without safetensors"
- },
- {
- "id": "damo-vilab/text-to-video-ms-1.7b",
- "name": "ModelScope T2V",
- "pipeline_class": "DiffusionPipeline",
- "variant": None,
- "use_safetensors": False,
- "resolution": (256, 256),
- "max_frames": 16,
- "dtype": torch.float16,
- "priority": 4,
- "description": "ModelScope reliable fallback"
- },
- {
- "id": "ali-vilab/text-to-video-ms-1.7b",
- "name": "AliVilab T2V",
- "pipeline_class": "DiffusionPipeline",
- "variant": None,
- "use_safetensors": False,
- "resolution": (256, 256),
- "max_frames": 16,
- "dtype": torch.float16,
- "priority": 5,
- "description": "AliVilab alternative"
  }
  ]
 
@@ -96,194 +69,230 @@ MODEL_INFO = None
  LOADING_LOGS = []
 
  def log_loading(message):
- """Enhanced logging"""
  global LOADING_LOGS
- print(message)
- LOADING_LOGS.append(f"{time.strftime('%H:%M:%S')} - {message}")
 
  def get_h200_memory():
- """Get H200 MIG memory stats"""
  if HAS_CUDA:
  try:
  total = torch.cuda.get_device_properties(0).total_memory / (1024**3)
  allocated = torch.cuda.memory_allocated(0) / (1024**3)
- return total, allocated
  except:
- return 0, 0
- return 0, 0
 
- def load_working_model():
- """Load first working model with H200 MIG optimizations"""
  global MODEL, MODEL_INFO, LOADING_LOGS
 
  if MODEL is not None:
  return True
 
  LOADING_LOGS = []
- log_loading("🚀 H200 MIG (69.5GB) model loading started...")
 
- total_mem, allocated_mem = get_h200_memory()
- log_loading(f"💾 Initial H200 memory: {total_mem:.1f}GB total, {allocated_mem:.1f}GB used")
 
- # Sort by priority
- sorted_models = sorted(WORKING_MODELS, key=lambda x: x["priority"])
 
  for model_config in sorted_models:
- if try_load_specific_model(model_config):
  return True
 
- log_loading("❌ All models failed on H200 MIG")
  return False
 
- def try_load_specific_model(config):
- """Try loading a specific model with exact configuration"""
  global MODEL, MODEL_INFO
 
  model_id = config["id"]
  model_name = config["name"]
 
- log_loading(f"🔄 Attempting {model_name}...")
- log_loading(f" 📋 Config: {config['pipeline_class']}, variant={config['variant']}, safetensors={config['use_safetensors']}")
 
  try:
- # Clear memory first
  if HAS_CUDA:
  torch.cuda.empty_cache()
  gc.collect()
 
- # Import appropriate pipeline
  if config["pipeline_class"] == "CogVideoXPipeline":
  from diffusers import CogVideoXPipeline
  PipelineClass = CogVideoXPipeline
  else:
- from diffusers import DiffusionPipeline
  PipelineClass = DiffusionPipeline
 
- # Prepare loading parameters
- load_params = {
- "torch_dtype": config["dtype"],
- "trust_remote_code": True
- }
-
- # Add variant only if specified
- if config["variant"]:
- load_params["variant"] = config["variant"]
-
- # Add safetensors setting
- if config["use_safetensors"]:
- load_params["use_safetensors"] = True
-
- log_loading(f" 📥 Loading with params: {load_params}")
-
- # Load model
- pipe = PipelineClass.from_pretrained(model_id, **load_params)
-
- # Move to H200 MIG GPU
  if HAS_CUDA:
  pipe = pipe.to("cuda")
- log_loading(f" 📱 Moved to H200 MIG CUDA")
-
- # H200 MIG optimizations (69.5GB is plenty!)
- if hasattr(pipe, 'enable_vae_slicing'):
- pipe.enable_vae_slicing()
- log_loading(f" ⚡ VAE slicing enabled")
-
- if hasattr(pipe, 'enable_vae_tiling'):
- pipe.enable_vae_tiling()
- log_loading(f" ⚡ VAE tiling enabled")
-
- if hasattr(pipe, 'enable_memory_efficient_attention'):
- pipe.enable_memory_efficient_attention()
- log_loading(f" ⚡ Memory efficient attention enabled")
-
- # Don't use CPU offload on H200 - keep everything in GPU
- log_loading(f" 🚀 Keeping model fully in H200 GPU memory")
 
  # Memory check after loading
- total_mem, allocated_mem = get_h200_memory()
- log_loading(f" 💾 Post-load memory: {allocated_mem:.1f}GB used / {total_mem:.1f}GB total")
 
  MODEL = pipe
  MODEL_INFO = config
 
- log_loading(f"✅ {model_name} loaded successfully on H200 MIG!")
  return True
 
  except Exception as e:
  log_loading(f"❌ {model_name} failed: {str(e)}")
- # Clear memory before next attempt
  if HAS_CUDA:
  torch.cuda.empty_cache()
  gc.collect()
  return False
 
- @spaces.GPU(duration=240) if SPACES_AVAILABLE else lambda x: x
- def generate_video(
  prompt: str,
  negative_prompt: str = "",
- num_frames: int = 25,
- num_inference_steps: int = 25,
- guidance_scale: float = 7.5,
  seed: int = -1
  ) -> Tuple[Optional[str], str]:
- """Generate video with H200 MIG power"""
 
  global MODEL, MODEL_INFO
 
- # Load model if needed
- if not load_working_model():
- logs = "\n".join(LOADING_LOGS[-10:]) # Last 10 log entries
- return None, f"❌ Model loading failed on H200 MIG\n\nRecent logs:\n{logs}"
 
  # Input validation
  if not prompt.strip():
- return None, "❌ Please enter a valid prompt."
 
- # Get model constraints
  max_frames = MODEL_INFO["max_frames"]
- width, height = MODEL_INFO["resolution"]
 
- # Adjust parameters for model
- num_frames = min(max(num_frames, 8), max_frames)
 
  try:
- # H200 MIG memory management
  start_memory = torch.cuda.memory_allocated(0) / (1024**3) if HAS_CUDA else 0
 
- # Set seed
  if seed == -1:
  seed = np.random.randint(0, 2**32 - 1)
 
  device = "cuda" if HAS_CUDA else "cpu"
  generator = torch.Generator(device=device).manual_seed(seed)
 
- log_loading(f"🎬 H200 MIG Generation: {MODEL_INFO['name']}")
- log_loading(f"📏 {width}x{height}, {num_frames} frames, {num_inference_steps} steps")
 
  start_time = time.time()
 
- # Generate with H200 MIG autocast
- with torch.autocast(device, dtype=MODEL_INFO["dtype"]):
- # Prepare generation arguments
  gen_kwargs = {
  "prompt": prompt,
- "num_frames": num_frames,
  "height": height,
  "width": width,
  "num_inference_steps": num_inference_steps,
  "guidance_scale": guidance_scale,
- "generator": generator
  }
 
- # Add negative prompt if provided
  if negative_prompt.strip():
  gen_kwargs["negative_prompt"] = negative_prompt
 
- # Model-specific adjustments
- if MODEL_INFO["name"] == "CogVideoX-5B":
  gen_kwargs["num_videos_per_prompt"] = 1
 
- log_loading(f"🚀 Starting H200 MIG generation...")
  result = MODEL(**gen_kwargs)
 
  end_time = time.time()
@@ -292,213 +301,293 @@ def generate_video(
  # Extract video frames
  if hasattr(result, 'frames'):
  video_frames = result.frames[0]
  elif hasattr(result, 'videos'):
  video_frames = result.videos[0]
  else:
- return None, "❌ Could not extract video frames"
 
- # Export video
  with tempfile.NamedTemporaryFile(suffix=".mp4", delete=False) as tmp_file:
  from diffusers.utils import export_to_video
- fps = 8
- export_to_video(video_frames, tmp_file.name, fps=fps)
  video_path = tmp_file.name
 
  # Memory stats
  end_memory = torch.cuda.memory_allocated(0) / (1024**3) if HAS_CUDA else 0
  memory_used = end_memory - start_memory
 
- success_msg = f"""✅ **H200 MIG Video Generated!**
 
- 🤖 **Model:** {MODEL_INFO['name']}
  📝 **Prompt:** {prompt}
- 🎬 **Frames:** {num_frames} @ {fps} FPS
  📏 **Resolution:** {width}x{height}
- ⚙️ **Inference Steps:** {num_inference_steps}
- 🎯 **Guidance Scale:** {guidance_scale}
  🎲 **Seed:** {seed}
- ⏱️ **Generation Time:** {generation_time:.1f}s
  🖥️ **Device:** H200 MIG (69.5GB)
  💾 **Memory Used:** {memory_used:.1f}GB
- 🎥 **Video Length:** {num_frames/fps:.1f}s
- 📋 **Notes:** {MODEL_INFO['description']}"""
 
- log_loading(f"✅ Generation completed in {generation_time:.1f}s")
 
  return video_path, success_msg
 
  except torch.cuda.OutOfMemoryError:
- torch.cuda.empty_cache()
  gc.collect()
- return None, "❌ H200 MIG memory exceeded (rare!). Try reducing parameters."
 
  except Exception as e:
  if HAS_CUDA:
  torch.cuda.empty_cache()
  gc.collect()
- return None, f"❌ H200 MIG generation failed: {str(e)}"
 
  def get_loading_logs():
- """Return formatted loading logs"""
  global LOADING_LOGS
  if not LOADING_LOGS:
  return "No loading attempts yet."
  return "\n".join(LOADING_LOGS)
 
- def get_h200_status():
- """Get H200 MIG specific status"""
- total_mem, allocated_mem = get_h200_memory()
 
- status = f"""## 🚀 H200 MIG Status
 
- **🖥️ Hardware:**
- - GPU: NVIDIA H200 MIG 3g.71gb
- - Total Memory: {total_mem:.1f} GB
- - Allocated: {allocated_mem:.1f} GB
- - Free: {total_mem - allocated_mem:.1f} GB
 
- **🤖 Current Model:**"""
-
- if MODEL is not None:
- status += f"""
- - ✅ **{MODEL_INFO['name']}** loaded and ready
- - 📏 Resolution: {MODEL_INFO['resolution']}
- - 🎬 Max Frames: {MODEL_INFO['max_frames']}
- - 💾 Memory Usage: {allocated_mem:.1f}GB
- - 📋 Details: {MODEL_INFO['description']}"""
- else:
- status += f"""
- - ⏳ No model loaded yet
- - 🔄 Will auto-load on first generation"""
-
- status += f"""
 
- **💡 H200 MIG Advantages:**
- - 69.5GB dedicated memory
- - Isolated GPU partition
- - Consistent performance
- - No interference from other workloads"""
-
- return status
 
- def force_reload():
- """Force model reload"""
- global MODEL, MODEL_INFO
- MODEL = None
- MODEL_INFO = None
- torch.cuda.empty_cache()
- gc.collect()
-
- success = load_working_model()
- logs = "\n".join(LOADING_LOGS[-5:]) # Last 5 entries
-
- return f"🔄 **Force Reload Result:** {'✅ Success' if success else '❌ Failed'}\n\nRecent logs:\n{logs}"
 
- # Create H200 MIG optimized interface
- with gr.Blocks(title="H200 MIG Video Generator", theme=gr.themes.Glass()) as demo:
 
  gr.Markdown("""
- # 🚀 H200 MIG Video Generator
 
- **NVIDIA H200 MIG 3g.71gb** • **69.5GB Memory** • **Working Models**
  """)
 
- # Status bar
  with gr.Row():
  gr.Markdown("""
- <div style="background: linear-gradient(45deg, #FF6B6B, #4ECDC4); padding: 10px; border-radius: 10px; text-align: center; color: white; font-weight: bold;">
- 🔥 H200 MIG ACTIVE - OPTIMIZED FOR YOUR SETUP 🔥
  </div>
  """)
 
- with gr.Tab("🎥 Generate Video"):
  with gr.Row():
  with gr.Column(scale=1):
  prompt_input = gr.Textbox(
- label="📝 Video Prompt",
- placeholder="A majestic eagle soaring through mountain peaks at golden hour, cinematic shot with dramatic lighting...",
- lines=4
  )
 
  negative_prompt_input = gr.Textbox(
- label="🚫 Negative Prompt",
- placeholder="blurry, low quality, distorted, pixelated, static...",
  lines=2
  )
 
- with gr.Accordion("⚙️ H200 MIG Settings", open=True):
  with gr.Row():
- num_frames = gr.Slider(8, 50, value=25, step=1, label="🎬 Frames")
- num_steps = gr.Slider(15, 50, value=25, step=1, label="⚙️ Steps")
 
  with gr.Row():
- guidance_scale = gr.Slider(1.0, 15.0, value=7.5, step=0.5, label="🎯 Guidance")
- seed = gr.Number(value=-1, precision=0, label="🎲 Seed")
 
- generate_btn = gr.Button("🚀 Generate on H200 MIG", variant="primary", size="lg")
 
  gr.Markdown("""
- **⏱️ Generation:** 1-3 minutes on H200 MIG
 
- **💡 Auto-detects:** Best working model for your setup
  """)
 
  with gr.Column(scale=1):
- video_output = gr.Video(label="🎥 H200 MIG Generated Video", height=400)
- result_text = gr.Textbox(label="📋 Generation Report", lines=10, show_copy_button=True)
 
  generate_btn.click(
- fn=generate_video,
- inputs=[prompt_input, negative_prompt_input, num_frames, num_steps, guidance_scale, seed],
  outputs=[video_output, result_text]
  )
 
- # H200 MIG optimized examples
  gr.Examples(
  examples=[
  [
- "A majestic golden eagle soaring through misty mountain peaks at sunrise",
- "blurry, low quality, static",
- 25, 25, 7.5, 42
  ],
  [
- "Ocean waves crashing against rocks during sunset, cinematic view",
- "pixelated, distorted, watermark",
- 30, 30, 8.0, 123
  ],
  [
- "A peaceful cat sleeping in a sunny garden with flowers",
- "dark, gloomy, low quality",
- 20, 20, 7.0, 456
  ],
  [
- "Time-lapse of clouds moving over a mountain landscape",
- "static, boring, blurry",
- 35, 35, 7.5, 789
  ]
  ],
- inputs=[prompt_input, negative_prompt_input, num_frames, num_steps, guidance_scale, seed]
  )
 
- with gr.Tab("🔧 H200 MIG Status"):
  with gr.Row():
- status_btn = gr.Button("🔍 Check H200 Status", variant="secondary")
- logs_btn = gr.Button("📋 View Loading Logs", variant="secondary")
- reload_btn = gr.Button("🔄 Force Reload", variant="secondary")
 
  status_output = gr.Markdown()
- logs_output = gr.Textbox(label="Detailed Loading Logs", lines=15, show_copy_button=True)
- reload_output = gr.Markdown()
 
- status_btn.click(fn=get_h200_status, outputs=status_output)
  logs_btn.click(fn=get_loading_logs, outputs=logs_output)
- reload_btn.click(fn=force_reload, outputs=reload_output)
 
  # Auto-load status
- demo.load(fn=get_h200_status, outputs=status_output)
 
  if __name__ == "__main__":
- demo.queue(max_size=3)
  demo.launch(
  share=False,
  server_name="0.0.0.0",
  from typing import Optional, Tuple
  import time
 
+ # ZeroGPU support
  try:
  import spaces
  SPACES_AVAILABLE = True
  SPACES_AVAILABLE = False
  class spaces:
  @staticmethod
+ def GPU(duration=300):
  def decorator(func): return func
  return decorator
 
  IS_SPACES = os.environ.get("SPACE_ID") is not None
  HAS_CUDA = torch.cuda.is_available()
 
+ print(f"🚀 H200 Premium Setup: ZeroGPU={IS_ZERO_GPU}, Spaces={IS_SPACES}, CUDA={HAS_CUDA}")
 
+ # PREMIUM MODELS ONLY - No low quality fallbacks
+ PREMIUM_MODELS = [
  {
+ "id": "THUDM/CogVideoX-5b",
+ "name": "CogVideoX-5B",
+ "pipeline_class": "CogVideoXPipeline",
+ "resolution_options": [(720, 480), (480, 720)],
+ "max_frames": 49,
  "dtype": torch.bfloat16,
+ "fps": 8,
  "priority": 1,
+ "description": "5B parameter video model - high quality"
  },
  {
+ "id": "THUDM/CogVideoX-2b",
+ "name": "CogVideoX-2B",
+ "pipeline_class": "CogVideoXPipeline",
+ "resolution_options": [(720, 480), (480, 720)],
  "max_frames": 49,
  "dtype": torch.bfloat16,
+ "fps": 8,
  "priority": 2,
+ "description": "2B parameter model - faster generation"
  },
  {
+ "id": "Lightricks/LTX-Video",
+ "name": "LTX-Video",
  "pipeline_class": "DiffusionPipeline",
+ "resolution_options": [(512, 512), (768, 768)],
+ "max_frames": 121, # LTX supports longer videos
+ "dtype": torch.bfloat16,
+ "fps": 24, # Higher FPS
  "priority": 3,
+ "description": "Professional video generation model"
  }
  ]
 
  LOADING_LOGS = []
 
  def log_loading(message):
+ """Enhanced logging with timestamps"""
  global LOADING_LOGS
+ timestamp = time.strftime('%H:%M:%S')
+ formatted_msg = f"[{timestamp}] {message}"
+ print(formatted_msg)
+ LOADING_LOGS.append(formatted_msg)
 
  def get_h200_memory():
+ """Get detailed H200 memory stats"""
  if HAS_CUDA:
  try:
  total = torch.cuda.get_device_properties(0).total_memory / (1024**3)
  allocated = torch.cuda.memory_allocated(0) / (1024**3)
+ reserved = torch.cuda.memory_reserved(0) / (1024**3)
+ return total, allocated, reserved
  except:
+ return 0, 0, 0
+ return 0, 0, 0
 
+ def load_premium_model():
+ """Load premium models only - no fallbacks"""
  global MODEL, MODEL_INFO, LOADING_LOGS
 
  if MODEL is not None:
  return True
 
  LOADING_LOGS = []
+ log_loading("🎯 H200 Premium Model Loading - QUALITY PRIORITY")
 
+ total_mem, allocated_mem, reserved_mem = get_h200_memory()
+ log_loading(f"💾 H200 Memory: {total_mem:.1f}GB total, {allocated_mem:.1f}GB allocated, {reserved_mem:.1f}GB reserved")
 
+ # Sort by priority (premium first)
+ sorted_models = sorted(PREMIUM_MODELS, key=lambda x: x["priority"])
 
  for model_config in sorted_models:
+ if try_load_premium_model(model_config):
  return True
 
+ log_loading("❌ All premium models failed - check model availability")
  return False
 
+ def try_load_premium_model(config):
+ """Try loading premium model with optimized settings"""
  global MODEL, MODEL_INFO
 
  model_id = config["id"]
  model_name = config["name"]
 
+ log_loading(f"🔄 Loading {model_name} (Premium)...")
+ log_loading(f" 📋 Target: {config['pipeline_class']}, {config['max_frames']} frames, {config['fps']} fps")
 
  try:
+ # Clear H200 memory
  if HAS_CUDA:
  torch.cuda.empty_cache()
+ torch.cuda.synchronize()
  gc.collect()
 
+ # Import specific pipeline
  if config["pipeline_class"] == "CogVideoXPipeline":
  from diffusers import CogVideoXPipeline
  PipelineClass = CogVideoXPipeline
+ log_loading(f" 📥 Using CogVideoXPipeline...")
  else:
+ from diffusers import DiffusionPipeline
  PipelineClass = DiffusionPipeline
+ log_loading(f" 📥 Using DiffusionPipeline...")
+
+ # Load with premium settings
+ log_loading(f" 🔄 Downloading/Loading model...")
+ pipe = PipelineClass.from_pretrained(
+ model_id,
+ torch_dtype=config["dtype"],
+ trust_remote_code=True,
+ # No variant, no use_safetensors restrictions
+ )
 
+ # Move to H200 and optimize
  if HAS_CUDA:
+ log_loading(f" 📱 Moving to H200 CUDA...")
  pipe = pipe.to("cuda")
+
+ # Premium optimizations for H200's 69.5GB
+ if hasattr(pipe, 'enable_vae_slicing'):
+ pipe.enable_vae_slicing()
+ log_loading(f" ⚡ VAE slicing enabled")
+
+ if hasattr(pipe, 'enable_vae_tiling'):
+ pipe.enable_vae_tiling()
+ log_loading(f" ⚡ VAE tiling enabled")
+
+ if hasattr(pipe, 'enable_memory_efficient_attention'):
+ pipe.enable_memory_efficient_attention()
+ log_loading(f" ⚡ Memory efficient attention enabled")
+
+ # For H200's large memory, keep everything in GPU
+ log_loading(f" 🚀 Keeping full model in H200 GPU memory")
 
  # Memory check after loading
+ total_mem, allocated_mem, reserved_mem = get_h200_memory()
+ log_loading(f" 💾 Post-load: {allocated_mem:.1f}GB allocated, {reserved_mem:.1f}GB reserved")
+
+ # Validate model capabilities
+ expected_frames = config["max_frames"]
+ expected_fps = config["fps"]
+ log_loading(f" ✅ {model_name} ready: {expected_frames} max frames @ {expected_fps} fps")
 
  MODEL = pipe
  MODEL_INFO = config
 
+ log_loading(f"🎯 SUCCESS: {model_name} loaded for premium generation!")
  return True
 
  except Exception as e:
  log_loading(f"❌ {model_name} failed: {str(e)}")
+ # Clear memory thoroughly
  if HAS_CUDA:
  torch.cuda.empty_cache()
+ torch.cuda.synchronize()
  gc.collect()
  return False
 
+ @spaces.GPU(duration=300) if SPACES_AVAILABLE else lambda x: x
+ def generate_premium_video(
  prompt: str,
  negative_prompt: str = "",
+ num_frames: int = 49,
+ resolution: str = "720x480",
+ num_inference_steps: int = 50,
+ guidance_scale: float = 6.0,
  seed: int = -1
  ) -> Tuple[Optional[str], str]:
+ """Generate premium quality video with proper parameters"""
 
  global MODEL, MODEL_INFO
 
+ # Load premium model
+ if not load_premium_model():
+ logs = "\n".join(LOADING_LOGS[-5:])
+ return None, f"❌ No premium models available\n\nLogs:\n{logs}"
 
  # Input validation
  if not prompt.strip():
+ return None, "❌ Please enter a detailed prompt for premium generation."
+
+ if len(prompt) < 10:
+ return None, "❌ Please provide a more detailed prompt (minimum 10 characters)."
+
+ # Parse resolution
+ try:
+ width, height = map(int, resolution.split('x'))
+ except:
+ width, height = MODEL_INFO["resolution_options"][0]
+
+ # Validate resolution
+ if (width, height) not in MODEL_INFO["resolution_options"]:
+ width, height = MODEL_INFO["resolution_options"][0]
+ log_loading(f"⚠️ Resolution adjusted to {width}x{height}")
 
+ # Validate frames
  max_frames = MODEL_INFO["max_frames"]
+ num_frames = min(max(num_frames, 16), max_frames) # Minimum 16 for quality
 
+ # Model-specific parameter optimization
+ if MODEL_INFO["name"].startswith("CogVideoX"):
+ # CogVideoX optimal parameters
+ guidance_scale = max(6.0, min(guidance_scale, 7.0)) # CogVideoX sweet spot
+ num_inference_steps = max(50, num_inference_steps) # Higher steps for quality
+ elif MODEL_INFO["name"] == "LTX-Video":
+ # LTX-Video optimal parameters
+ guidance_scale = max(7.0, min(guidance_scale, 8.5)) # LTX sweet spot
+ num_inference_steps = max(30, num_inference_steps)
 
  try:
+ # H200 memory preparation
  start_memory = torch.cuda.memory_allocated(0) / (1024**3) if HAS_CUDA else 0
 
+ # Enhanced seed handling
  if seed == -1:
  seed = np.random.randint(0, 2**32 - 1)
 
  device = "cuda" if HAS_CUDA else "cpu"
  generator = torch.Generator(device=device).manual_seed(seed)
 
+ log_loading(f"🎬 PREMIUM GENERATION START")
+ log_loading(f"📋 Model: {MODEL_INFO['name']}")
+ log_loading(f"📏 Resolution: {width}x{height}")
+ log_loading(f"🎞️ Frames: {num_frames} @ {MODEL_INFO['fps']} fps = {num_frames/MODEL_INFO['fps']:.1f}s video")
+ log_loading(f"⚙️ Steps: {num_inference_steps}, Guidance: {guidance_scale}")
+ log_loading(f"📝 Prompt: {prompt[:100]}...")
 
  start_time = time.time()
 
+ # Premium generation with optimal autocast
+ with torch.autocast(device, dtype=MODEL_INFO["dtype"], enabled=HAS_CUDA):
+
+ # Prepare generation parameters
  gen_kwargs = {
  "prompt": prompt,
  "height": height,
  "width": width,
+ "num_frames": num_frames,
  "num_inference_steps": num_inference_steps,
  "guidance_scale": guidance_scale,
+ "generator": generator,
  }
 
+ # Add negative prompt for quality
  if negative_prompt.strip():
  gen_kwargs["negative_prompt"] = negative_prompt
+ else:
+ # Default negative prompt for premium quality
+ default_negative = "blurry, low quality, distorted, pixelated, compression artifacts, watermark, text, signature, amateur, static, boring"
+ gen_kwargs["negative_prompt"] = default_negative
+ log_loading(f"🚫 Using default negative prompt for quality")
 
+ # Model-specific parameters
+ if MODEL_INFO["name"].startswith("CogVideoX"):
  gen_kwargs["num_videos_per_prompt"] = 1
+ log_loading(f"🎥 CogVideoX generation starting...")
 
+ # Generate with progress
+ log_loading(f"🚀 H200 generation in progress...")
  result = MODEL(**gen_kwargs)
 
  end_time = time.time()
 
  # Extract video frames
  if hasattr(result, 'frames'):
  video_frames = result.frames[0]
+ log_loading(f"📹 Extracted {len(video_frames)} frames")
  elif hasattr(result, 'videos'):
  video_frames = result.videos[0]
+ log_loading(f"📹 Extracted video tensor: {video_frames.shape}")
  else:
+ log_loading(f"❌ Unknown result format: {type(result)}")
+ return None, "❌ Could not extract video frames from result"
+
+ # Export with proper FPS
+ target_fps = MODEL_INFO["fps"]
+ actual_duration = num_frames / target_fps
 
  with tempfile.NamedTemporaryFile(suffix=".mp4", delete=False) as tmp_file:
  from diffusers.utils import export_to_video
+ export_to_video(video_frames, tmp_file.name, fps=target_fps)
  video_path = tmp_file.name
+ log_loading(f"🎬 Exported to {tmp_file.name} @ {target_fps} fps")
 
  # Memory stats
  end_memory = torch.cuda.memory_allocated(0) / (1024**3) if HAS_CUDA else 0
  memory_used = end_memory - start_memory
 
+ # Success report
+ success_msg = f"""🎯 **PREMIUM H200 VIDEO GENERATED**
 
+ 🤖 **Model:** {MODEL_INFO['name']}
  📝 **Prompt:** {prompt}
+ 🎬 **Video:** {num_frames} frames @ {target_fps} fps = **{actual_duration:.1f} seconds**
  📏 **Resolution:** {width}x{height}
+ ⚙️ **Quality:** {num_inference_steps} inference steps
+ 🎯 **Guidance:** {guidance_scale}
  🎲 **Seed:** {seed}
+ ⏱️ **Generation Time:** {generation_time:.1f}s ({generation_time/60:.1f} minutes)
  🖥️ **Device:** H200 MIG (69.5GB)
  💾 **Memory Used:** {memory_used:.1f}GB
+ 📋 **Model Notes:** {MODEL_INFO['description']}
+
+ **🎥 Video Quality:** Premium quality with {num_frames} frames over {actual_duration:.1f} seconds"""
 
+ log_loading(f"✅ PREMIUM generation completed: {actual_duration:.1f}s video in {generation_time:.1f}s")
 
  return video_path, success_msg
 
  except torch.cuda.OutOfMemoryError:
+ if HAS_CUDA:
+ torch.cuda.empty_cache()
  gc.collect()
+ return None, "❌ H200 memory exceeded. Try reducing frames or resolution."
 
  except Exception as e:
  if HAS_CUDA:
  torch.cuda.empty_cache()
  gc.collect()
+ error_msg = str(e)
+ log_loading(f"❌ Generation error: {error_msg}")
+ return None, f"❌ Premium generation failed: {error_msg}"
+
+ def get_model_status():
+ """Get current premium model status"""
+ if MODEL is None:
+ return "⏳ **No premium model loaded** - will auto-load on generation"
+
+ fps = MODEL_INFO["fps"]
+ max_frames = MODEL_INFO["max_frames"]
+ max_duration = max_frames / fps
+ resolutions = ", ".join([f"{w}x{h}" for w, h in MODEL_INFO["resolution_options"]])
+
+ return f"""🎯 **{MODEL_INFO['name']} Ready**
+
+ **📋 Premium Capabilities:**
+ - **Max Duration:** {max_duration:.1f} seconds ({max_frames} frames @ {fps} fps)
+ - **Resolutions:** {resolutions}
+ - **Quality:** {MODEL_INFO['description']}
+
+ **⚡ H200 Optimizations:**
+ - Full model in GPU memory
+ - Memory efficient attention
+ - VAE optimizations enabled
+
+ **💡 This model produces {max_duration:.1f} second videos with {max_frames} frames!**"""
 
  def get_loading_logs():
+ """Get formatted loading logs"""
  global LOADING_LOGS
  if not LOADING_LOGS:
  return "No loading attempts yet."
  return "\n".join(LOADING_LOGS)
 
+ def suggest_premium_settings():
+ """Suggest optimal settings for current model"""
+ if MODEL is None:
+ return "Load a premium model first."
 
+ model_name = MODEL_INFO['name']
+ max_frames = MODEL_INFO['max_frames']
+ fps = MODEL_INFO['fps']
+ max_duration = max_frames / fps
+
+ return f"""## 🎯 Optimal Settings for {model_name}
 
+ **🚀 Maximum Quality:**
+ - Frames: {max_frames} (full {max_duration:.1f} second video)
+ - Inference Steps: 50+
+ - Guidance Scale: {6.0 if 'CogVideo' in model_name else 7.5}
+ - Resolution: {MODEL_INFO['resolution_options'][-1]}
 
+ **⚖️ Balanced (Recommended):**
+ - Frames: {max_frames//2} ({max_frames//2/fps:.1f} second video)
+ - Inference Steps: 35-50
+ - Guidance Scale: {6.0 if 'CogVideo' in model_name else 7.5}
 
+ **⚡ Fast Test:**
+ - Frames: 25 ({25/fps:.1f} second video)
+ - Inference Steps: 30
+ - Guidance Scale: {6.0 if 'CogVideo' in model_name else 7.5}
 
+ **📝 Premium Prompting Tips:**
+ - Be very specific and detailed
+ - Include camera movements: "slow zoom", "tracking shot"
+ - Describe lighting: "golden hour", "cinematic lighting"
+ - Add style: "professional cinematography", "8K quality"
+ - Mention motion: "smooth movement", "graceful motion"
+
+ **Example Premium Prompt:**
+ "A majestic golden eagle soaring gracefully through misty mountain peaks during golden hour, cinematic tracking shot with shallow depth of field, professional wildlife cinematography, smooth gliding motion, warm sunset lighting, 8K quality"
+
+ Remember: Longer videos need more detailed prompts to maintain coherence!"""
 
+ # Create premium interface
+ with gr.Blocks(title="H200 Premium Video Generator", theme=gr.themes.Glass()) as demo:
 
  gr.Markdown("""
+ # 🎯 H200 Premium Video Generator
 
+ **Premium Models Only** • **Long-Form Videos** • **Professional Quality**
+
+ *CogVideoX-5B • LTX-Video • No Low-Quality Fallbacks*
  """)
 
+ # Premium status
  with gr.Row():
  gr.Markdown("""
+ <div style="background: linear-gradient(45deg, #FFD700, #FF6B6B); padding: 15px; border-radius: 15px; text-align: center; color: white; font-weight: bold; font-size: 18px;">
+ 🏆 PREMIUM MODE - H200 MIG 69.5GB - QUALITY PRIORITY 🏆
  </div>
  """)
 
+ with gr.Tab("🎬 Premium Generation"):
  with gr.Row():
  with gr.Column(scale=1):
  prompt_input = gr.Textbox(
+ label="📝 Detailed Video Prompt (Premium Quality)",
+ placeholder="A breathtaking aerial view of a majestic golden eagle soaring gracefully through dramatic mountain peaks shrouded in morning mist, cinematic wildlife documentary style with slow motion tracking shot, professional cinematography with warm golden hour lighting and shallow depth of field, smooth gliding motion across epic landscape, 8K quality with film grain texture...",
+ lines=5,
+ max_lines=8
  )
 
  negative_prompt_input = gr.Textbox(
+ label="🚫 Negative Prompt (Optional - auto-applied for quality)",
+ placeholder="blurry, low quality, distorted, pixelated, compression artifacts, watermark, text, signature, amateur, static, boring, jerky motion...",
  lines=2
  )
 
+ with gr.Accordion("🎯 Premium Settings", open=True):
  with gr.Row():
+ num_frames = gr.Slider(
+ minimum=16,
+ maximum=49,
+ value=49,
+ step=1,
+ label="🎬 Video Frames (16 = 2s, 49 = 6s+)"
+ )
+
+ resolution = gr.Dropdown(
+ choices=["720x480", "480x720"],
+ value="720x480",
+ label="📏 Resolution"
+ )
 
  with gr.Row():
+ num_steps = gr.Slider(
+ minimum=30,
+ maximum=100,
+ value=50,
+ step=5,
+ label="⚙️ Inference Steps (50+ for premium quality)"
+ )
+
+ guidance_scale = gr.Slider(
+ minimum=4.0,
+ maximum=10.0,
+ value=6.0,
+ step=0.5,
+ label="🎯 Guidance Scale"
+ )
+
+ seed = gr.Number(
+ label="🎲 Seed (-1 for random)",
+ value=-1,
+ precision=0
+ )
 
+ generate_btn = gr.Button(
+ "🎯 Generate Premium Video",
+ variant="primary",
+ size="lg"
+ )
 
  gr.Markdown("""
+ **⏱️ Premium Generation:** 2-5 minutes for quality
+
+ **🎥 Output:** 2-6+ second high-quality videos
 
+ **💡 Premium Tips:**
+ - Use very detailed, specific prompts
+ - Higher inference steps = better quality
+ - Longer videos need more descriptive prompts
  """)
 
  with gr.Column(scale=1):
+ video_output = gr.Video(
+ label="🎥 Premium H200 Generated Video",
+ height=400
+ )
+
+ result_text = gr.Textbox(
+ label="📋 Premium Generation Report",
+ lines=12,
+ show_copy_button=True
+ )
 
+ # Generate button
  generate_btn.click(
+ fn=generate_premium_video,
+ inputs=[
+ prompt_input, negative_prompt_input, num_frames,
+ resolution, num_steps, guidance_scale, seed
+ ],
  outputs=[video_output, result_text]
  )
 
+ # Premium examples
  gr.Examples(
  examples=[
  [
+ "A majestic golden eagle soaring gracefully through misty mountain peaks during golden hour, cinematic wildlife documentary style with slow motion tracking shot, professional cinematography with warm lighting and shallow depth of field, smooth gliding motion, 8K quality",
+ "blurry, low quality, static, amateur, pixelated",
+ 49, "720x480", 50, 6.0, 42
  ],
  [
+ "Ocean waves crashing against dramatic coastal cliffs during a storm, professional seascape cinematography with dynamic camera movement, slow motion water spray and foam, dramatic lighting with storm clouds, high contrast and deep blues, cinematic quality",
+ "calm, peaceful, low quality, static, boring",
+ 41, "720x480", 60, 6.5, 123
  ],
  [
+ "A steaming artisanal coffee cup on rustic wooden table by rain-streaked window, cozy cafe atmosphere with warm ambient lighting, shallow depth of field with bokeh background, steam rising elegantly, professional commercial cinematography, intimate close-up shot",
+ "cold, harsh lighting, plastic, fake, low quality, distorted",
+ 33, "720x480", 45, 6.0, 456
  ],
  [
+ "Time-lapse of cherry blossom petals falling like snow in traditional Japanese garden with wooden bridge over koi pond, peaceful zen atmosphere with soft natural lighting, seasonal transition captured in cinematic wide shot, perfect composition and color grading",
+ "modern, urban, chaotic, low quality, static, artificial",
+ 49, "720x480", 55, 6.5, 789
  ]
  ],
+ inputs=[prompt_input, negative_prompt_input, num_frames, resolution, num_steps, guidance_scale, seed]
  )
 
+ with gr.Tab("🎯 Premium Status"):
  with gr.Row():
+ status_btn = gr.Button("🔍 Model Status", variant="secondary")
+ logs_btn = gr.Button("📋 Loading Logs", variant="secondary")
+ settings_btn = gr.Button("⚙️ Optimal Settings", variant="secondary")
 
  status_output = gr.Markdown()
+ logs_output = gr.Textbox(label="Detailed Logs", lines=12, show_copy_button=True)
+ settings_output = gr.Markdown()
 
+ status_btn.click(fn=get_model_status, outputs=status_output)
  logs_btn.click(fn=get_loading_logs, outputs=logs_output)
+ settings_btn.click(fn=suggest_premium_settings, outputs=settings_output)
 
  # Auto-load status
+ demo.load(fn=get_model_status, outputs=status_output)
 
  if __name__ == "__main__":
+ demo.queue(max_size=2) # Premium quality needs smaller queue
  demo.launch(
  share=False,
  server_name="0.0.0.0",