Spaces:

ginigen
/

Seedance-Free

Running

File size: 20,555 Bytes

dc72519
 
989bf3e
dc72519
 
 
239e0d9
dc72519
989bf3e
 
 
dc72519
989bf3e
239e0d9
dc72519
239e0d9
8f84113
989bf3e
8f84113
 
 
 
 
 
 
239e0d9
989bf3e
bfb51e0
 
989bf3e
 
 
 
 
239e0d9
a5e046f
dc72519
a5e046f
 
 
 
 
 
 
dc72519
 
3558e0d
 
 
 
8f84113
 
 
 
 
9f85f32
8f84113
 
 
 
9f85f32
8f84113
 
9f85f32
8f84113
 
989bf3e
8f84113
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
9f85f32
8f84113
 
 
9f85f32
8f84113
9f85f32
 
8f84113
 
 
989bf3e
8f84113
 
 
 
 
 
989bf3e
 
 
 
 
 
9f85f32
dc72519
a5e046f
 
3558e0d
 
 
 
239e0d9
3558e0d
 
 
 
dc72519
 
a5e046f
 
a8b22a6
 
dc72519
a8b22a6
 
dc72519
989bf3e
 
 
 
84f75cc
989bf3e
 
84f75cc
989bf3e
84f75cc
989bf3e
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
84f75cc
a8b22a6
989bf3e
239e0d9
a5e046f
dc72519
a5e046f
239e0d9
a8b22a6
 
 
239e0d9
dc72519
989bf3e
dc72519
989bf3e
 
 
 
dc72519
989bf3e
 
 
 
 
 
 
 
 
 
a8b22a6
 
 
 
 
 
 
 
 
 
 
 
989bf3e
 
a8b22a6
 
 
989bf3e
a8b22a6
 
 
 
 
 
 
239e0d9
989bf3e
 
a8b22a6
989bf3e
 
 
 
 
 
 
 
 
 
 
dc72519
989bf3e
dc72519
989bf3e
 
 
 
 
a8b22a6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
dc72519
989bf3e
 
3558e0d
989bf3e
 
3558e0d
989bf3e
 
2504a64
989bf3e
 
 
 
dc72519
989bf3e
dc72519
a5e046f
dc72519
 
9f85f32
 
8f84113
 
 
9f85f32
8f84113
989bf3e
8f84113
 
 
 
 
dc72519
8f84113
 
 
 
 
9f85f32
8f84113
9f85f32
8f84113
 
 
 
dc72519
a5e046f
dc72519
a5e046f
8f84113
a5e046f
239e0d9
a5e046f
 
 
dc72519
a5e046f
 
8f84113
989bf3e
 
a5e046f
dc72519
9f85f32
dc72519
3558e0d
989bf3e
dc72519
989bf3e
dc72519
a5e046f
 
dc72519
a5e046f
239e0d9
989bf3e
239e0d9
989bf3e
dc72519
989bf3e
 
84f75cc
dc72519
 
a5e046f
989bf3e
 
 
bfb51e0
 
989bf3e
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
239e0d9
a5e046f
dc72519
a5e046f
 
 
239e0d9
 
a8b22a6
 
 
 
 
 
 
 
 
 
bfb51e0
 
a8b22a6
239e0d9
989bf3e
dc72519
a8b22a6
dc72519
 
a8b22a6
 
dc72519
239e0d9
a5e046f
 
239e0d9
a5e046f
dc72519
a5e046f
989bf3e
dc72519
989bf3e
dc72519
239e0d9
a5e046f
8f84113
 
a5e046f
 
 
989bf3e
8f84113
dc72519
 
 
a5e046f
dc72519
a5e046f
dc72519
3558e0d
 
dc72519
239e0d9
989bf3e
 
239e0d9
a5e046f
dc72519
 
a5e046f
dc72519
 
 
a5e046f
989bf3e
dc72519
239e0d9
 
a5e046f
 
dc72519
a5e046f
dc72519
a5e046f
dc72519
989bf3e
8f84113
 
 
 
 
dc72519
 
989bf3e
dc72519
bfb51e0
 
dc72519
 
8f84113
dc72519
 
 
 
a5e046f
dc72519
a8b22a6
 
 
 
 
989bf3e
8f84113
dc72519
a8b22a6
 
 
 
 
 
 
 
 
 
989bf3e
 
 
 
 
 
 
a5e046f
dc72519
a5e046f
 
 
 
dc72519
239e0d9
a5e046f
dc72519
 
a8b22a6
 
 
 
dc72519
a8b22a6
989bf3e
dc72519
239e0d9
a5e046f
dc72519
 
 
 
 
239e0d9
dc72519
 
 
a8b22a6
dc72519
239e0d9
dc72519
a5e046f
dc72519
 
 
239e0d9
dc72519
 
a8b22a6
dc72519
 
239e0d9
a5e046f
dc72519

#!/usr/bin/env python3
"""
AI Video Generator with Gradio - WaveSpeed API Version
Single file application - app.py
"""

import os
import gradio as gr
import requests
import json
import time
import base64
from PIL import Image
import io
from datetime import datetime
import tempfile

# Try to import video processing libraries for watermark
try:
    # Both packages are needed by the watermark step; numpy is only imported
    # once cv2 has been found, exactly as before.
    import cv2
    import numpy as np
except ImportError:
    # Optional dependency missing: the app keeps running without watermarking.
    VIDEO_PROCESSING_AVAILABLE = False
    print("Warning: cv2 not available. Watermark feature will be disabled.")
else:
    VIDEO_PROCESSING_AVAILABLE = True

# API keys setup from environment variables
# SECURITY: credentials must never live in source control. The literal keys
# that used to be embedded here as os.getenv() fallbacks have been removed;
# they were published with this file and should be revoked/rotated.
#
# Both the WAVESPEED_* names and the shorter WS_* names shown in the UI help
# text are honoured (WAVESPEED_* wins). An empty string means "not configured";
# in that case the per-request override fields in the UI must be used.
API_KEY_T2V = os.getenv("WAVESPEED_API_KEY_T2V") or os.getenv("WS_API_KEY_T2V", "")
API_KEY_I2V = os.getenv("WAVESPEED_API_KEY_I2V") or os.getenv("WS_API_KEY_I2V", "")

# API endpoints
API_BASE_URL = "https://api.wavespeed.ai/api/v3"
T2V_ENDPOINT = f"{API_BASE_URL}/bytedance/seedance-v1-lite-t2v-480p"
I2V_ENDPOINT = f"{API_BASE_URL}/bytedance/seedance-v1-lite-i2v-480p"

# Aspect ratio options: API value -> human-readable label shown under the dropdown
ASPECT_RATIOS = {
    "16:9": "16:9 (YouTube, Standard Video)",
    "4:3": "4:3 (Traditional TV Format)",
    "1:1": "1:1 (Instagram Feed)",
    "3:4": "3:4 (Instagram Portrait)",
    "9:16": "9:16 (Instagram Reels, TikTok)",
    "21:9": "21:9 (Cinematic Wide)",
    "9:21": "9:21 (Ultra Vertical)",
}

# Default prompts (the image-to-video prompt is pre-filled when that mode is selected)
DEFAULT_TEXT_PROMPT = ""
DEFAULT_IMAGE_PROMPT = "Generate a video with smooth and natural movement. Objects should have visible motion while maintaining fluid transitions."

def add_watermark_cv2(input_video_path, output_video_path):
    """Re-encode a video with a "ginigen.com" text watermark using OpenCV.

    Every frame of ``input_video_path`` is read, a semi-transparent black box
    with white text is drawn in the bottom-right corner, and the frame is
    written to ``output_video_path`` with the ``mp4v`` codec.

    Args:
        input_video_path: Path of the source video file.
        output_video_path: Path the watermarked video is written to.

    Returns:
        True if at least one watermarked frame was written; False if OpenCV is
        unavailable, the input/output could not be opened, no frames were
        produced, or any error occurred (the error is printed, not raised).
    """
    if not VIDEO_PROCESSING_AVAILABLE:
        return False

    cap = None
    out = None
    try:
        cap = cv2.VideoCapture(input_video_path)
        if not cap.isOpened():
            print(f"Watermark error: cannot open input video {input_video_path}")
            return False

        # Keep the frame rate as a float: truncating e.g. 29.97 to 29 changes
        # the playback speed of the re-encoded file.
        fps = cap.get(cv2.CAP_PROP_FPS)
        if not fps > 0:  # also true for NaN
            fps = 24.0  # arbitrary fallback when the container reports no rate
        width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
        height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
        if width <= 0 or height <= 0:
            print("Watermark error: input video reports an invalid frame size")
            return False

        fourcc = cv2.VideoWriter_fourcc(*'mp4v')
        out = cv2.VideoWriter(output_video_path, fourcc, fps, (width, height))
        if not out.isOpened():
            print(f"Watermark error: cannot open output video {output_video_path}")
            return False

        watermark_text = "ginigen.com"
        font = cv2.FONT_HERSHEY_SIMPLEX
        # Scale text with the frame height, with lower bounds so it stays legible.
        font_scale = max(0.4, height * 0.001)
        font_thickness = max(1, int(height * 0.002))

        (text_width, text_height), _baseline = cv2.getTextSize(
            watermark_text, font, font_scale, font_thickness
        )
        # Anchor the text in the bottom-right corner with a 2%-of-width margin.
        padding = int(width * 0.02)
        x = width - text_width - padding
        y = height - padding

        frames_written = 0
        while True:
            ret, frame = cap.read()
            if not ret:
                break

            # Draw an opaque box on a copy, then blend it at 30% so the
            # background behind the text is darkened rather than blacked out.
            overlay = frame.copy()
            cv2.rectangle(overlay,
                          (x - 5, y - text_height - 5),
                          (x + text_width + 5, y + 5),
                          (0, 0, 0),
                          -1)
            frame = cv2.addWeighted(frame, 0.7, overlay, 0.3, 0)
            cv2.putText(frame, watermark_text, (x, y), font, font_scale,
                        (255, 255, 255), font_thickness, cv2.LINE_AA)
            out.write(frame)
            frames_written += 1

        # NOTE: cv2.destroyAllWindows() was dropped on purpose: no window is
        # ever created here, and GUI calls can raise on headless OpenCV builds,
        # which would have turned a successful encode into a reported failure.
        return frames_written > 0

    except Exception as e:
        print(f"Watermark error: {str(e)}")
        return False
    finally:
        # Always release the native handles, including on the error paths.
        if cap is not None:
            cap.release()
        if out is not None:
            out.release()

def add_watermark(input_video_path, output_video_path):
    """Write a watermarked copy of a video, falling back to a plain copy.

    Args:
        input_video_path: Path of the source video file.
        output_video_path: Path the result is written to.

    Returns:
        True only when the OpenCV watermark was applied. False when the
        watermark could not be applied; in that case a best-effort,
        un-watermarked copy of the input is attempted at ``output_video_path``
        (a failure of that copy is printed and still reported as False).
    """
    if VIDEO_PROCESSING_AVAILABLE and add_watermark_cv2(input_video_path, output_video_path):
        return True

    # Fallback - just copy without watermark
    import shutil
    try:
        shutil.copy2(input_video_path, output_video_path)
    except Exception as e:
        # Best effort only: report instead of silently swallowing, and avoid a
        # bare ``except`` so KeyboardInterrupt/SystemExit still propagate.
        print(f"Watermark fallback copy failed: {str(e)}")
    return False

def update_prompt_placeholder(mode):
    """Return a Gradio update that swaps the prompt box's placeholder and value.

    "Text to Video" clears the prompt; any other mode pre-fills it with
    DEFAULT_IMAGE_PROMPT and shows the image-motion hint.
    """
    if mode == "Text to Video":
        hint = "Describe the video you want to create.\nExample: The sun rises slowly between tall buildings. [Ground-level follow shot] Bicycle tires roll over a dew-covered street at dawn."
        initial_text = ""
    else:
        hint = "Describe how the image should move.\nExample: Camera slowly zooms in while clouds move across the sky. The subject's hair gently moves in the wind."
        initial_text = DEFAULT_IMAGE_PROMPT

    return gr.update(placeholder=hint, value=initial_text)

def update_image_input(mode):
    """Toggle visibility of the image inputs and the aspect-ratio dropdown.

    Returns a pair of Gradio updates: (image input group, aspect ratio).
    The image inputs are shown only for "Image to Video"; the aspect ratio
    is shown for every other mode.
    """
    image_mode = mode == "Image to Video"
    image_group_update = gr.update(visible=image_mode)
    aspect_ratio_update = gr.update(visible=not image_mode)
    return image_group_update, aspect_ratio_update

def poll_for_result(request_id, api_key, progress_callback=None, timeout=300,
                    poll_interval=2, max_transient_errors=3):
    """Poll the WaveSpeed API until a generation request finishes.

    Args:
        request_id: Prediction id returned when the job was submitted.
        api_key: Bearer token sent in the Authorization header.
        progress_callback: Optional callable ``(fraction, desc=...)`` invoked
            after every successful poll with a value between 0.3 and 0.9.
        timeout: Maximum number of seconds to wait for the job (default 300).
        poll_interval: Seconds to sleep between polls (default 2).
        max_transient_errors: Number of consecutive network errors tolerated
            before giving up, so one dropped connection does not discard a
            job that is still running remotely.

    Returns:
        ``(True, video_url)`` on success, otherwise ``(False, error_message)``.
    """
    url = f"{API_BASE_URL}/predictions/{request_id}/result"
    headers = {"Authorization": f"Bearer {api_key}"}

    start_time = time.time()
    consecutive_errors = 0
    while True:
        try:
            response = requests.get(url, headers=headers, timeout=30)
        except requests.exceptions.RequestException as e:
            consecutive_errors += 1
            out_of_time = time.time() - start_time > timeout
            if consecutive_errors > max_transient_errors or out_of_time:
                return False, f"Connection error: {str(e)}"
            time.sleep(poll_interval)
            continue
        consecutive_errors = 0

        if response.status_code != 200:
            return False, f"API Error: {response.status_code} - {response.text}"

        # A malformed body is an API problem, not a connection problem.
        try:
            result = response.json()["data"]
            status = result["status"]
        except (ValueError, KeyError, TypeError) as e:
            return False, f"Unexpected API response: {str(e)}"

        elapsed = time.time() - start_time
        if progress_callback:
            # Map elapsed time onto the 0.3-0.9 band of the progress bar,
            # assuming a typical job takes about two minutes.
            progress_val = min(0.3 + (elapsed / 120) * 0.6, 0.9)
            progress_callback(progress_val, desc=f"Processing... Status: {status} ({int(elapsed)}s)")

        if status == "completed":
            outputs = result.get("outputs") or []
            if not outputs:
                return False, "Generation completed but no video URL was returned"
            return True, outputs[0]
        if status == "failed":
            error_msg = result.get('error', 'Unknown error')
            return False, f"Generation failed: {error_msg}"
        if elapsed > timeout:
            return False, "Timeout: Generation took too long"

        # Continue polling
        time.sleep(poll_interval)

def generate_video(mode, prompt, image_url, image_file, aspect_ratio, seed, api_key_override_t2v, api_key_override_i2v, progress=gr.Progress()):
    """Generate a video through the WaveSpeed API and return it for display.

    Submits a text-to-video or image-to-video job, polls until it finishes,
    downloads the result, optionally watermarks it, and also saves a copy as
    ``output.mp4`` in the current working directory.

    Args:
        mode: "Text to Video" or "Image to Video".
        prompt: Text description; must not be empty or whitespace-only.
        image_url: Direct image URL (image mode); takes precedence over
            ``image_file`` when both are given.
        image_file: Uploaded image, either a PIL image or a file path; sent
            as a base64 PNG data URL when no ``image_url`` is supplied.
        aspect_ratio: Aspect ratio key, sent to the API in text mode only.
        seed: Seed value; ``None`` or a negative number means random (-1).
        api_key_override_t2v: Optional key replacing API_KEY_T2V.
        api_key_override_i2v: Optional key replacing API_KEY_I2V.
        progress: Gradio progress tracker.

    Returns:
        ``(video_path, info_text)`` on success, or ``(None, error_text)``.
        Errors are reported through the message; nothing is raised.
    """

    # Input validation
    if not prompt or not prompt.strip():
        return None, "❌ Please enter a prompt."

    if mode == "Image to Video":
        if not image_url and image_file is None:
            return None, "❌ Please provide an image URL or upload an image."

    # A cleared gr.Number field arrives as None; comparing None with 0 would
    # raise, so normalise once. The API is always sent -1 for "random".
    api_seed = -1 if seed is None or seed < 0 else int(seed)

    try:
        progress(0, desc="Preparing request...")

        # Determine which API to use
        if mode == "Text to Video":
            api_key = api_key_override_t2v or API_KEY_T2V
            endpoint = T2V_ENDPOINT

            payload = {
                "aspect_ratio": aspect_ratio,
                "duration": 5,
                "prompt": prompt,
                "seed": api_seed
            }
        else:  # Image to Video
            api_key = api_key_override_i2v or API_KEY_I2V
            endpoint = I2V_ENDPOINT

            # Handle image input
            if image_url:
                # Use provided URL directly
                final_image_url = image_url
            elif image_file is not None:
                # Convert the uploaded image to a PNG data URL
                progress(0.1, desc="Converting image to data URL...")

                buffered = io.BytesIO()
                if isinstance(image_file, str):
                    with Image.open(image_file) as img:
                        img.save(buffered, format="PNG")
                else:
                    image_file.save(buffered, format="PNG")

                image_base64 = base64.b64encode(buffered.getvalue()).decode()

                # Note: If the API doesn't accept data URLs, the image has to be
                # hosted elsewhere; the error path below tells the user how.
                final_image_url = f"data:image/png;base64,{image_base64}"
            else:
                return None, "❌ No image provided."

            payload = {
                "duration": 5,
                "image": final_image_url,
                "prompt": prompt,
                "seed": api_seed
            }

        # Submit request
        progress(0.2, desc="Submitting request to WaveSpeed AI...")

        headers = {
            "Content-Type": "application/json",
            "Authorization": f"Bearer {api_key}"
        }

        response = requests.post(endpoint, headers=headers, data=json.dumps(payload), timeout=30)

        if response.status_code == 200:
            result = response.json()["data"]
            request_id = result["id"]
            progress(0.3, desc=f"Request submitted. ID: {request_id}")
        else:
            error_detail = response.text
            if mode == "Image to Video" and image_file is not None and not image_url:
                return None, f"""❌ API Error: {response.status_code}

The API may not accept base64 data URLs. Please try one of these options:
1. Use a direct image URL (e.g., https://example.com/image.jpg)
2. Upload your image to an image hosting service like:
   - imgur.com
   - imgbb.com
   - postimages.org
3. Use the image URL in the Image URL field

Error details: {error_detail}"""
            else:
                return None, f"❌ API Error: {response.status_code} - {error_detail}"

        # Poll for result
        success, result = poll_for_result(request_id, api_key, lambda p, desc: progress(p, desc=desc))

        if not success:
            return None, f"❌ {result}"

        video_url = result
        progress(0.9, desc="Downloading video...")

        # Download video
        video_response = requests.get(video_url, timeout=60)
        if video_response.status_code != 200:
            return None, f"❌ Failed to download video from {video_url}"

        video_data = video_response.content

        # Save to temporary file
        with tempfile.NamedTemporaryFile(delete=False, suffix='.mp4') as tmp_file:
            tmp_file.write(video_data)
            temp_video_path = tmp_file.name

        # Try to add watermark
        watermark_added = False
        final_video_path = temp_video_path

        if VIDEO_PROCESSING_AVAILABLE:
            progress(0.95, desc="Adding watermark...")
            # mkstemp creates the file atomically; tempfile.mktemp only returns
            # a name and is deprecated because another process can claim it.
            fd, watermarked_path = tempfile.mkstemp(suffix='.mp4')
            os.close(fd)
            watermark_added = add_watermark(temp_video_path, watermarked_path)

            # The target now always exists, so also require it to be non-empty.
            if (watermark_added
                    and os.path.exists(watermarked_path)
                    and os.path.getsize(watermarked_path) > 0):
                final_video_path = watermarked_path
            else:
                # Keep the reported status in line with the file actually
                # returned, and drop the unused fallback copy.
                watermark_added = False
                try:
                    os.unlink(watermarked_path)
                except OSError:
                    pass  # best-effort cleanup of a temp file

        # Save final video
        with open(final_video_path, "rb") as f:
            final_video_data = f.read()
        with open("output.mp4", "wb") as file:
            file.write(final_video_data)

        # Clean up temp files
        if temp_video_path != final_video_path and os.path.exists(temp_video_path):
            try:
                os.unlink(temp_video_path)
            except OSError:
                pass  # best-effort cleanup of a temp file

        progress(1.0, desc="Complete!")

        # Generation info
        if watermark_added:
            watermark_status = "Added"
        elif not VIDEO_PROCESSING_AVAILABLE:
            watermark_status = "Not available (cv2 not installed)"
        else:
            watermark_status = "Failed"
        info = f"""✅ Video generated successfully!

📊 Generation Info:
- Mode: {mode}
- Aspect Ratio: {aspect_ratio}
- Seed: {seed}
- Duration: 5 seconds
- Resolution: 480p
- Watermark: {watermark_status}
- API: WaveSpeed AI
- Cost: $0.06
- File: output.mp4"""

        return final_video_path, info

    except requests.exceptions.Timeout:
        return None, "⏱️ Request timed out. Please try again."
    except Exception as e:
        # UI boundary: surface any failure as a message instead of a traceback.
        return None, f"❌ Error occurred: {str(e)}"

# Gradio interface
# Declarative UI definition. Components are laid out in creation order, so the
# statement order inside each container is significant.
with gr.Blocks(title="Bytedance Seedance Video Free", theme=gr.themes.Soft()) as app:
    gr.Markdown("""
    # 🎬 Bytedance Seedance Video Free

    Generate videos from text or images using **WaveSpeed AI API**.

    [![Powered by Ginigen](https://img.shields.io/badge/Powered%20by-WaveSpeed%20AI-blue)](https://ginigen.com/)

    ⚠️ **Note**: Each generation costs $0.06
    """)

    with gr.Row():
        # Left column: settings and inputs
        with gr.Column(scale=1):
            # API Settings
            with gr.Accordion("⚙️ API Settings", open=False):
                # The variable names shown here must match the os.getenv()
                # lookups at the top of this file.
                gr.Markdown("""
                API keys are loaded from environment variables:
                - `WAVESPEED_API_KEY_T2V` for Text-to-Video
                - `WAVESPEED_API_KEY_I2V` for Image-to-Video

                You can override them below if needed.
                """)

                api_key_override_t2v = gr.Textbox(
                    label="Text-to-Video API Key (Optional Override)",
                    type="password",
                    placeholder="Leave empty to use environment variable",
                    value=""
                )

                api_key_override_i2v = gr.Textbox(
                    label="Image-to-Video API Key (Optional Override)",
                    type="password",
                    placeholder="Leave empty to use environment variable",
                    value=""
                )

            # Generation mode
            mode = gr.Radio(
                label="🎯 Generation Mode",
                choices=["Text to Video", "Image to Video"],
                value="Text to Video"
            )

            # Image input - URL or file (hidden until "Image to Video" is selected)
            with gr.Column(visible=False) as image_input_group:
                gr.Markdown("### Image Input")
                image_url_input = gr.Textbox(
                    label="📷 Image URL",
                    placeholder="https://example.com/image.jpg",
                    info="Enter a direct image URL"
                )
                gr.Markdown("**OR**")
                image_file_input = gr.Image(
                    label="📤 Upload Image (Beta) - Converted to data URL (may not work)",
                    type="pil"
                )

            # Aspect ratio (only for T2V)
            aspect_ratio = gr.Dropdown(
                label="📐 Aspect Ratio (Text to Video only)",
                choices=list(ASPECT_RATIOS.keys()),
                value="16:9",
                info="Choose ratio optimized for social media platforms",
                visible=True
            )

            # Ratio description
            ratio_info = gr.Markdown(value=f"Selected ratio: {ASPECT_RATIOS['16:9']}")

            # Seed setting
            seed = gr.Number(
                label="🎲 Random Seed",
                value=-1,
                precision=0,
                info="Use -1 for random, or set a specific value for reproducible results"
            )

            # Fixed settings display
            watermark_info = "ginigen.com" if VIDEO_PROCESSING_AVAILABLE else "ginigen.com (requires cv2)"
            gr.Markdown(f"""
            ### 📋 Fixed Settings
            - **Duration**: 5 seconds
            - **Resolution**: 480p
            - **Cost**: $0.06 per video
            - **Watermark**: {watermark_info}
            """)

        # Right column: prompt, action button and results
        with gr.Column(scale=2):
            # Prompt input
            prompt = gr.Textbox(
                label="✍️ Prompt",
                lines=5,
                placeholder="Describe the video you want to create.\nExample: The sun rises slowly between tall buildings. [Ground-level follow shot] Bicycle tires roll over a dew-covered street at dawn.",
                value=""
            )

            # Generate button
            generate_btn = gr.Button("🎬 Generate Video ($0.06)", variant="primary", size="lg")

            # Results display
            with gr.Column():
                output_video = gr.Video(
                    label="📹 Generated Video",
                    autoplay=True
                )
                output_info = gr.Textbox(
                    label="Information",
                    lines=10,
                    interactive=False
                )

    # Usage instructions
    with gr.Accordion("📖 How to Use", open=False):
        gr.Markdown("""
        ### Installation

        1. **Install required packages**:
        ```bash
        pip install gradio requests pillow
        ```

        2. **For watermark support (optional)**:
        ```bash
        pip install opencv-python
        ```

        3. **Set environment variables**:
        ```bash
        export WAVESPEED_API_KEY_T2V="your-t2v-api-key"
        export WAVESPEED_API_KEY_I2V="your-i2v-api-key"
        ```

        4. **Run**:
        ```bash
        python app.py
        ```

        ### Features

        - **Text to Video**: Generate video from text description with aspect ratio selection
        - **Image to Video**: Transform image into animated video
          - Option 1: Provide direct image URL (recommended)
          - Option 2: Upload image file (converted to data URL - may not work)
        - **Aspect Ratios**: Available for Text to Video only
        - **Seed Value**: Use -1 for random or set specific value for reproducible results
        - **Watermark**: Automatically adds "ginigen.com" watermark (requires opencv-python)

        ### Image to Video Tips

        For best results with Image to Video:
        1. Use direct image URLs (https://...)
        2. If uploading files doesn't work, upload your image to:
           - [imgur.com](https://imgur.com)
           - [imgbb.com](https://imgbb.com)
           - [postimages.org](https://postimages.org)
        3. Copy the direct image URL and paste it in the Image URL field

        ### API Information

        - **Provider**: WaveSpeed AI
        - **Models**: ByteDance Seedance v1 Lite
        - **Cost**: $0.06 per 5-second video
        - **Resolution**: 480p

        ### Prompt Writing Tips

        - Use specific and detailed descriptions
        - Specify camera movements (e.g., zoom in, pan left, tracking shot)
        - Describe lighting and atmosphere (e.g., golden hour, dramatic lighting)
        - Indicate movement speed (e.g., slowly, rapidly, gently)
        """)

    # Examples: each row is [mode, prompt, image URL, image file, aspect ratio, seed]
    gr.Examples(
        examples=[
            ["Text to Video", "A cat walking gracefully across a sunlit room", "", None, "16:9", -1],
            ["Text to Video", "A serene lake at sunrise with mist rolling over the water. Camera slowly pans across the landscape as birds fly overhead.", "", None, "16:9", 42],
            ["Text to Video", "Urban street scene at night with neon lights reflecting on wet pavement. People walking with umbrellas, camera tracking forward.", "", None, "9:16", 123],
            ["Image to Video", "The camera slowly zooms in while clouds drift across the sky", "https://images.unsplash.com/photo-1506905925346-21bda4d32df4", None, "16:9", -1],
        ],
        inputs=[mode, prompt, image_url_input, image_file_input, aspect_ratio, seed],
        label="Example Prompts"
    )

    # Event handlers
    # Switching mode resets the prompt box...
    mode.change(
        fn=update_prompt_placeholder,
        inputs=[mode],
        outputs=[prompt]
    )

    # ...and toggles the image inputs against the aspect-ratio dropdown.
    mode.change(
        fn=update_image_input,
        inputs=[mode],
        outputs=[image_input_group, aspect_ratio]
    )

    # Keep the descriptive label under the dropdown in sync with the selection.
    aspect_ratio.change(
        fn=lambda x: f"Selected ratio: {ASPECT_RATIOS[x]}",
        inputs=[aspect_ratio],
        outputs=[ratio_info]
    )

    # The input order must match generate_video's positional parameters.
    generate_btn.click(
        fn=generate_video,
        inputs=[mode, prompt, image_url_input, image_file_input, aspect_ratio, seed, api_key_override_t2v, api_key_override_i2v],
        outputs=[output_video, output_info]
    )

# Run app
if __name__ == "__main__":
    # Listen on every interface at port 7860, without a public share link,
    # and ask Gradio to open a browser tab on start-up.
    launch_options = {
        "server_name": "0.0.0.0",
        "server_port": 7860,
        "share": False,
        "inbrowser": True,
    }
    app.launch(**launch_options)