Spaces:

ginigen
/

Seedance-Free

Running

File size: 19,630 Bytes

dc72519
 
 
 
 
 
239e0d9
dc72519
239e0d9
dc72519
9f85f32
239e0d9
dc72519
 
239e0d9
3558e0d
8f84113
 
 
 
 
 
 
 
 
239e0d9
a5e046f
239e0d9
8f84113
 
239e0d9
a5e046f
dc72519
a5e046f
 
 
 
 
 
 
dc72519
 
3558e0d
 
 
 
8f84113
 
 
 
 
9f85f32
8f84113
 
9f85f32
8f84113
 
 
 
9f85f32
8f84113
 
 
9f85f32
8f84113
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
9f85f32
8f84113
 
 
 
9f85f32
 
8f84113
9f85f32
 
8f84113
 
 
 
 
9f85f32
 
 
8f84113
 
 
 
 
 
 
 
 
 
 
 
 
9f85f32
dc72519
a5e046f
 
3558e0d
 
 
 
239e0d9
3558e0d
 
 
 
dc72519
 
a5e046f
 
dc72519
 
 
 
2504a64
3558e0d
 
 
 
2504a64
3558e0d
 
 
 
 
 
 
 
 
 
dc72519
a5e046f
239e0d9
a5e046f
dc72519
 
a5e046f
239e0d9
dc72519
239e0d9
a5e046f
dc72519
a5e046f
239e0d9
a5e046f
 
239e0d9
dc72519
a5e046f
239e0d9
a5e046f
dc72519
 
 
 
 
 
 
 
a5e046f
 
 
dc72519
a5e046f
 
dc72519
 
 
 
a5e046f
dc72519
 
 
239e0d9
dc72519
 
3558e0d
dc72519
2504a64
 
dc72519
3558e0d
2504a64
3558e0d
 
 
 
 
 
 
2504a64
 
3558e0d
 
2504a64
3558e0d
 
2504a64
 
 
 
 
3558e0d
2504a64
 
 
 
 
 
 
 
 
 
3558e0d
2504a64
 
 
3558e0d
 
2504a64
 
 
 
 
 
 
3558e0d
 
 
 
2504a64
3558e0d
 
 
 
 
 
 
 
2504a64
 
 
 
a5e046f
dc72519
a5e046f
dc72519
 
 
3558e0d
 
dc72519
 
a5e046f
dc72519
 
9f85f32
 
8f84113
 
 
9f85f32
8f84113
 
 
 
 
 
 
dc72519
8f84113
 
 
 
 
9f85f32
8f84113
9f85f32
8f84113
 
 
 
dc72519
a5e046f
dc72519
a5e046f
8f84113
a5e046f
239e0d9
a5e046f
 
 
dc72519
a5e046f
 
8f84113
a5e046f
dc72519
9f85f32
dc72519
3558e0d
 
dc72519
a5e046f
3558e0d
 
dc72519
 
a5e046f
 
dc72519
a5e046f
239e0d9
a5e046f
239e0d9
ac825a1
dc72519
 
 
 
a5e046f
 
dc72519
a5e046f
dc72519
a5e046f
dc72519
a5e046f
dc72519
 
 
a5e046f
dc72519
a5e046f
dc72519
a5e046f
dc72519
 
239e0d9
a5e046f
dc72519
a5e046f
 
 
239e0d9
 
a5e046f
dc72519
a5e046f
dc72519
 
 
239e0d9
a5e046f
dc72519
a5e046f
dc72519
 
a5e046f
dc72519
239e0d9
a5e046f
 
239e0d9
a5e046f
dc72519
a5e046f
dc72519
 
a5e046f
dc72519
239e0d9
a5e046f
8f84113
 
a5e046f
 
 
8f84113
dc72519
 
 
a5e046f
dc72519
a5e046f
dc72519
3558e0d
 
dc72519
239e0d9
a5e046f
 
239e0d9
a5e046f
dc72519
 
a5e046f
dc72519
 
 
a5e046f
dc72519
 
239e0d9
 
a5e046f
 
dc72519
a5e046f
dc72519
a5e046f
dc72519
8f84113
 
 
 
 
 
dc72519
 
8f84113
dc72519
 
 
 
8f84113
dc72519
 
 
 
a5e046f
dc72519
a5e046f
 
 
 
8f84113
dc72519
a5e046f
dc72519
a5e046f
 
 
 
3558e0d
 
 
 
 
 
8f84113
dc72519
239e0d9
a5e046f
dc72519
 
a5e046f
 
 
dc72519
 
a5e046f
dc72519
239e0d9
a5e046f
dc72519
 
 
 
 
239e0d9
dc72519
 
 
 
 
239e0d9
dc72519
a5e046f
dc72519
 
 
239e0d9
dc72519
 
 
 
 
239e0d9
a5e046f
dc72519

#!/usr/bin/env python3
"""
AI Video Generator with Gradio
Single file application - app.py
"""

import os
import gradio as gr
import replicate
import base64
from PIL import Image, ImageDraw, ImageFont
import io
import requests
from datetime import datetime
import tempfile
import time

# Optional video-processing stack. The watermark feature needs OpenCV (and
# numpy alongside it); when either import fails the app keeps running with
# watermarking switched off.
try:
    import cv2
    import numpy as np
except ImportError:
    VIDEO_PROCESSING_AVAILABLE = False
    print("Warning: cv2 not available. Watermark feature will be disabled.")
else:
    VIDEO_PROCESSING_AVAILABLE = True

# API token setup: the deployment stores the token under RAPI_TOKEN, and it is
# mirrored into REPLICATE_API_TOKEN when present.
api_token = os.environ.get("RAPI_TOKEN")
if api_token:
    os.environ["REPLICATE_API_TOKEN"] = api_token

# Aspect ratio options: key is the value sent to the model, value is the
# human-readable label shown under the dropdown. Insertion order is the
# order of the dropdown choices.
ASPECT_RATIOS = {
    "16:9": "16:9 (YouTube, Standard Video)",
    "4:3": "4:3 (Traditional TV Format)",
    "1:1": "1:1 (Instagram Feed)",
    "3:4": "3:4 (Instagram Portrait)",
    "9:16": "9:16 (Instagram Reels, TikTok)",
    "21:9": "21:9 (Cinematic Wide)",
    "9:21": "9:21 (Ultra Vertical)",
}

# Default prompts pre-filled into the prompt box for each generation mode
DEFAULT_TEXT_PROMPT = ""
DEFAULT_IMAGE_PROMPT = (
    "Generate a video with smooth and natural movement. "
    "Objects should have visible motion while maintaining fluid transitions."
)

def add_watermark_cv2(input_video_path, output_video_path):
    """Burn a "ginigen.com" text watermark into a video using OpenCV.

    Every frame of ``input_video_path`` is read, a semi-transparent dark box
    with white text is drawn in the bottom-right corner, and the result is
    written to ``output_video_path`` with the ``mp4v`` codec.

    Args:
        input_video_path: Path of the video to read.
        output_video_path: Path the watermarked video is written to.

    Returns:
        True when at least one watermarked frame was written; False when
        OpenCV is unavailable, the input or output could not be opened, no
        frame could be read, or any error occurred (the error is printed).
    """
    if not VIDEO_PROCESSING_AVAILABLE:
        return False

    cap = None
    out = None
    try:
        # Open the video
        cap = cv2.VideoCapture(input_video_path)
        if not cap.isOpened():
            print(f"Watermark error: could not open {input_video_path}")
            return False

        # Get video properties. The frame rate is kept as a float so that
        # fractional rates (e.g. 29.97) are not truncated, which would change
        # the playback speed of the re-encoded video.
        fps = cap.get(cv2.CAP_PROP_FPS)
        if not fps > 0:  # also catches NaN
            fps = 24.0  # fallback when the container reports no usable rate
        width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
        height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
        if width <= 0 or height <= 0:
            print("Watermark error: video reports an empty frame size")
            return False

        # Define codec and create VideoWriter
        fourcc = cv2.VideoWriter_fourcc(*'mp4v')
        out = cv2.VideoWriter(output_video_path, fourcc, fps, (width, height))
        if not out.isOpened():
            print(f"Watermark error: could not open {output_video_path} for writing")
            return False

        # Watermark settings
        watermark_text = "ginigen.com"
        font = cv2.FONT_HERSHEY_SIMPLEX
        font_scale = max(0.4, height * 0.001)  # Scale based on video height
        font_thickness = max(1, int(height * 0.002))

        # Get text size
        (text_width, text_height), _baseline = cv2.getTextSize(
            watermark_text, font, font_scale, font_thickness
        )

        # Position (bottom right with padding); clamp so the text never
        # starts left of the frame on very narrow videos.
        padding = int(width * 0.02)
        x = max(0, width - text_width - padding)
        y = height - padding

        # Process each frame
        frames_written = 0
        while True:
            ret, frame = cap.read()
            if not ret:
                break

            # Add semi-transparent background for text: blend the frame with
            # a copy that has a filled black rectangle behind the text area.
            overlay = frame.copy()
            cv2.rectangle(overlay,
                          (x - 5, y - text_height - 5),
                          (x + text_width + 5, y + 5),
                          (0, 0, 0),
                          -1)
            frame = cv2.addWeighted(frame, 0.7, overlay, 0.3, 0)

            # Add text
            cv2.putText(frame, watermark_text, (x, y), font, font_scale,
                        (255, 255, 255), font_thickness, cv2.LINE_AA)

            # Write frame
            out.write(frame)
            frames_written += 1

        # An output with no frames is not a usable video, so report failure
        # and let the caller fall back to the original file.
        return frames_written > 0

    except Exception as e:
        print(f"Watermark error: {str(e)}")
        return False
    finally:
        # Always release the capture and the writer, including on errors.
        # No cv2.destroyAllWindows() here: this function opens no windows,
        # and GUI calls can raise in GUI-less (headless) OpenCV builds, which
        # would turn a successful run into a reported failure.
        if cap is not None:
            cap.release()
        if out is not None:
            out.release()

def add_watermark_simple(input_video_path, output_video_path):
    """Fallback used when no watermark can be drawn: duplicate the video as-is.

    The input file is copied to ``output_video_path``. The return value
    reports whether a watermark was added, so it is always False, both when
    the copy succeeds and when it fails (a failure is printed).
    """
    from shutil import copy2

    try:
        copy2(input_video_path, output_video_path)
    except Exception as copy_error:
        print(f"Copy error: {str(copy_error)}")

    # No watermark is ever applied on this path.
    return False

def add_watermark(input_video_path, output_video_path):
    """Watermark a video with OpenCV when possible, otherwise copy it unchanged.

    Returns True only when the OpenCV path reports success. In every other
    case the plain-copy fallback runs and its result (False) is returned.
    """
    watermarked = VIDEO_PROCESSING_AVAILABLE and add_watermark_cv2(
        input_video_path, output_video_path
    )
    if watermarked:
        return True

    # Fallback - just copy without watermark
    return add_watermark_simple(input_video_path, output_video_path)

def update_prompt_placeholder(mode):
    """Return a Gradio update that resets the prompt box for the chosen mode.

    "Text to Video" gets a text-oriented placeholder and an empty value; any
    other mode gets the image-motion placeholder and the default image prompt.
    """
    if mode == "Text to Video":
        hint = "Describe the video you want to create.\nExample: The sun rises slowly between tall buildings. [Ground-level follow shot] Bicycle tires roll over a dew-covered street at dawn."
        text = ""
    else:
        hint = "Describe how the image should move.\nExample: Camera slowly zooms in while clouds move across the sky. The subject's hair gently moves in the wind."
        text = DEFAULT_IMAGE_PROMPT

    return gr.update(placeholder=hint, value=text)

def update_image_input(mode):
    """Return a Gradio update making the image uploader visible only in "Image to Video" mode."""
    needs_image = mode == "Image to Video"
    return gr.update(visible=needs_image)

def wait_for_model_with_retry(model_name, max_retries=5, initial_wait=10):
    """Look up a Replicate model, retrying with a linearly growing delay.

    Args:
        model_name: Model identifier passed to ``replicate.models.get``.
        max_retries: Maximum number of lookup attempts.
        initial_wait: Base delay in seconds; attempt *k* (1-based) is followed
            by a sleep of ``initial_wait * k`` seconds before the next try.

    Returns:
        True as soon as a lookup succeeds, False once every attempt has
        failed (or when ``max_retries`` allows no attempt at all).
    """
    for attempt_number in range(1, max_retries + 1):
        try:
            # Only success or failure of the lookup matters; the result is unused.
            replicate.models.get(model_name)
        except Exception:
            if attempt_number == max_retries:
                # Out of attempts: no point sleeping again.
                return False
            delay = initial_wait * attempt_number
            print(f"Model not ready, waiting {delay} seconds... (Attempt {attempt_number}/{max_retries})")
            time.sleep(delay)
        else:
            return True
    return False

def _image_to_data_uri(image):
    """Encode *image* (a file path or a PIL image) as a PNG ``data:`` URI."""
    buffered = io.BytesIO()
    if isinstance(image, str):  # File path
        with Image.open(image) as img:
            img.save(buffered, format="PNG")
    else:  # PIL Image object
        image.save(buffered, format="PNG")
    image_base64 = base64.b64encode(buffered.getvalue()).decode()
    return f"data:image/png;base64,{image_base64}"


def _fetch_video_bytes(output):
    """Return the raw video bytes for a model *output* (file-like object or URL)."""
    if hasattr(output, 'read'):
        return output.read()
    # Download from URL with timeout. Fail loudly on an HTTP error instead of
    # saving the error page as if it were the video.
    response = requests.get(output, timeout=60)
    response.raise_for_status()
    return response.content


def _remove_quietly(path):
    """Delete *path*, ignoring the case where it is missing or cannot be removed."""
    try:
        os.unlink(path)
    except OSError:
        pass


def generate_video(mode, prompt, image, aspect_ratio, seed, api_key_input, progress=gr.Progress()):
    """Generate a 5-second 480p video via Replicate and return it for display.

    Args:
        mode: "Text to Video" or "Image to Video".
        prompt: Text prompt; must be non-empty.
        image: Source image (PIL image or file path); required in
            "Image to Video" mode, ignored otherwise.
        aspect_ratio: Aspect ratio string forwarded to the model.
        seed: Seed forwarded to the model as an integer; omitted when None.
        api_key_input: Token typed into the UI; overrides the environment
            token when non-empty.
        progress: Gradio progress callback.

    Returns:
        A ``(video_path, message)`` tuple. ``video_path`` is the path of the
        generated (and, when possible, watermarked) video, or None on failure;
        ``message`` is a human-readable status or error text. On success the
        video is also written to ``output.mp4`` in the working directory.
    """

    # API token check: a key typed into the UI wins over the environment token
    token = api_key_input or api_token
    if not token:
        return None, "❌ API token required. Please set RAPI_TOKEN environment variable or enter your API key."

    # NOTE(review): this stores the token in the process-wide environment, so
    # a key entered by one user stays in effect for later requests handled by
    # the same process. Consider a per-request client if that is a concern.
    os.environ["REPLICATE_API_TOKEN"] = token

    # Input validation
    if not prompt:
        return None, "❌ Please enter a prompt."

    if mode == "Image to Video" and image is None:
        return None, "❌ Please upload an image."

    try:
        progress(0, desc="Preparing video generation...")

        # Input parameters setup
        input_params = {
            "prompt": prompt,
            "duration": 5,
            "resolution": "480p",
            "aspect_ratio": aspect_ratio,
        }
        # A cleared seed field arrives as None; leave the key out in that
        # case rather than sending a null seed.
        if seed is not None:
            input_params["seed"] = int(seed)

        # Image to video mode
        if mode == "Image to Video" and image is not None:
            progress(0.1, desc="Processing image...")
            input_params["image"] = _image_to_data_uri(image)

        progress(0.2, desc="Checking model availability...")

        # Set up Replicate with the API token
        replicate.api_token = token

        # Wait for model to be ready
        model_ready = wait_for_model_with_retry("bytedance/seedance-1-lite")
        if not model_ready:
            return None, "⏳ Model is still booting up. Please try again in a few minutes."

        progress(0.3, desc="Calling Replicate API...")

        # Run Replicate with retry logic
        max_attempts = 3
        output = None

        for attempt in range(max_attempts):
            is_last_attempt = attempt == max_attempts - 1
            # Never carry a partial result over from a failed attempt.
            output = None
            try:
                # Run Replicate - use the model directly without version specifier
                start_time = time.time()
                result = replicate.run(
                    "bytedance/seedance-1-lite",
                    input=input_params
                )

                # A file-like result is the finished output even if it is also
                # iterable (iterating it would presumably yield raw byte
                # chunks, not events), so test for read() before iterating.
                is_single_value = (
                    hasattr(result, 'read')
                    or isinstance(result, (str, bytes))
                    or not hasattr(result, '__iter__')
                )
                if is_single_value:
                    output = result
                else:
                    for event in result:
                        elapsed = time.time() - start_time
                        progress_val = min(0.3 + (elapsed / 300) * 0.4, 0.7)
                        progress(progress_val, desc=f"Generating video... ({int(elapsed)}s)")
                        output = event  # Keep the last event as output

                # If we got output, break the retry loop
                if output:
                    break

            except replicate.exceptions.ReplicateError as e:
                error_str = str(e)
                lowered = error_str.lower()
                if is_last_attempt:
                    # Out of retries: surface the actual API error instead of
                    # falling through to a generic failure message.
                    return None, f"❌ Replicate API error: {error_str}"
                if "cold boot" in lowered or "starting" in lowered:
                    progress(0.3, desc=f"Model is starting up, retrying... (Attempt {attempt + 2}/{max_attempts})")
                    time.sleep(30)
                    continue
                if "timeout" in lowered:
                    progress(0.3, desc=f"Timeout occurred, retrying... (Attempt {attempt + 2}/{max_attempts})")
                    time.sleep(10)
                    continue
                # Any other API error is not worth retrying.
                return None, f"❌ Replicate API error: {error_str}"
            except Exception as e:
                if is_last_attempt:
                    return None, f"❌ Unexpected error: {str(e)}"
                progress(0.3, desc=f"Error occurred, retrying... (Attempt {attempt + 2}/{max_attempts})")
                time.sleep(5)

        # Check if we got output
        if not output:
            return None, "❌ Failed to generate video after multiple attempts."

        progress(0.7, desc="Downloading video...")

        # Get video data
        video_data = _fetch_video_bytes(output)

        # Save to temporary file
        with tempfile.NamedTemporaryFile(delete=False, suffix='.mp4') as tmp_file:
            tmp_file.write(video_data)
            temp_video_path = tmp_file.name
        scratch_paths = [temp_video_path]

        # Try to add watermark
        watermark_added = False
        final_video_path = temp_video_path

        if VIDEO_PROCESSING_AVAILABLE:
            progress(0.8, desc="Adding watermark...")
            # Reserve the output path by actually creating the file;
            # tempfile.mktemp only returns a name and is deprecated.
            with tempfile.NamedTemporaryFile(delete=False, suffix='.mp4') as marked_file:
                watermarked_path = marked_file.name
            scratch_paths.append(watermarked_path)

            watermark_added = add_watermark(temp_video_path, watermarked_path)
            if watermark_added and os.path.exists(watermarked_path):
                final_video_path = watermarked_path

        # Save final video
        with open(final_video_path, "rb") as f:
            final_video_data = f.read()
        with open("output.mp4", "wb") as file:
            file.write(final_video_data)

        # Clean up every temp file except the one handed back to the UI
        for scratch_path in scratch_paths:
            if scratch_path != final_video_path:
                _remove_quietly(scratch_path)

        progress(1.0, desc="Complete!")

        # Generation info
        if watermark_added:
            watermark_status = "Added"
        elif not VIDEO_PROCESSING_AVAILABLE:
            watermark_status = "Not available (cv2 not installed)"
        else:
            watermark_status = "Failed"
        info = f"""✅ Video generated successfully!

📊 Generation Info:
- Mode: {mode}
- Aspect Ratio: {aspect_ratio}
- Seed: {seed}
- Duration: 5 seconds
- Resolution: 480p
- Watermark: {watermark_status}
- File: output.mp4"""

        return final_video_path, info

    except requests.exceptions.Timeout:
        return None, "⏱️ Request timed out. The server might be under heavy load. Please try again in a few minutes."
    except Exception as e:
        error_msg = f"❌ Error occurred: {str(e)}"
        if "timeout" in str(e).lower():
            error_msg += "\n\n💡 Tip: The model might be cold starting. Please wait a minute and try again."
        return None, error_msg

# Gradio interface
# The whole UI is declared inside one Blocks context. Components appear on the
# page in the order they are created below, so statement order is the layout:
# a two-column row (settings on the left, prompt and results on the right),
# then a collapsed usage guide, example prompts, and finally the event wiring.
with gr.Blocks(title="Bytedance Seedance Video Free", theme=gr.themes.Soft()) as app:
    # Page header.
    # NOTE(review): the heading text contains a stray apostrophe after "Video",
    # and the badge's alt text says "Powered by Ginigen" while the badge image
    # itself reads "Powered by Replicate" - confirm which wording is intended.
    gr.Markdown("""
    # 🎬 Bytedance Seedance Video' Free
    
    Generate videos from text or images using **Replicate API**.
    
    [![Powered by Ginigen](https://img.shields.io/badge/Powered%20by-Replicate-blue)](https://ginigen.com/)
    """)
    
    with gr.Row():
        # Left column: API token and generation settings
        with gr.Column(scale=1):
            # API Settings
            # The accordion starts expanded only when no token was found in
            # the environment, i.e. when the user has to supply one.
            with gr.Accordion("⚙️ API Settings", open=not bool(api_token)):
                if api_token:
                    # Environment token present: the textbox is an optional override
                    gr.Markdown("✅ API token loaded from environment variable.")
                    api_key_input = gr.Textbox(
                        label="Replicate API Token (Optional)",
                        type="password",
                        placeholder="Enter to override environment variable",
                        value=""
                    )
                else:
                    # No environment token: the user must enter one here
                    gr.Markdown("⚠️ RAPI_TOKEN environment variable not set.")
                    api_key_input = gr.Textbox(
                        label="Replicate API Token (Required)",
                        type="password",
                        placeholder="Enter your Replicate API token",
                        value=""
                    )
            
            # Generation mode
            # These two choice strings are compared literally by the mode
            # handlers and by generate_video.
            mode = gr.Radio(
                label="🎯 Generation Mode",
                choices=["Text to Video", "Image to Video"],
                value="Text to Video"
            )
            
            # Image upload
            # Hidden initially because the default mode is "Text to Video";
            # update_image_input toggles visibility when the mode changes.
            image_input = gr.Image(
                label="📷 Upload Image",
                type="pil",
                visible=False
            )
            
            # Aspect ratio
            # Choices are the keys of ASPECT_RATIOS; the selected key is what
            # gets passed to generate_video.
            aspect_ratio = gr.Dropdown(
                label="📐 Aspect Ratio",
                choices=list(ASPECT_RATIOS.keys()),
                value="16:9",
                info="Choose ratio optimized for social media platforms"
            )
            
            # Ratio description
            # Shows the long label for the selected ratio; kept in sync by the
            # aspect_ratio.change handler below.
            ratio_info = gr.Markdown(value=f"Selected ratio: {ASPECT_RATIOS['16:9']}")
            
            # Seed setting
            seed = gr.Number(
                label="🎲 Random Seed",
                value=42,
                precision=0,
                info="Use same seed value to reproduce same results"
            )
            
            # Fixed settings display
            # Duration and resolution mirror the values hard-coded in
            # generate_video; the watermark line notes the cv2 requirement
            # when OpenCV could not be imported.
            watermark_info = "ginigen.com" if VIDEO_PROCESSING_AVAILABLE else "ginigen.com (requires cv2)"
            gr.Markdown(f"""
            ### 📋 Fixed Settings
            - **Duration**: 5 seconds
            - **Resolution**: 480p
            - **Watermark**: {watermark_info}
            """)
        
        # Right column: prompt, generate button and results
        with gr.Column(scale=2):
            # Prompt input
            # The initial placeholder matches the "Text to Video" branch of
            # update_prompt_placeholder.
            prompt = gr.Textbox(
                label="✍️ Prompt",
                lines=5,
                placeholder="Describe the video you want to create.\nExample: The sun rises slowly between tall buildings. [Ground-level follow shot] Bicycle tires roll over a dew-covered street at dawn.",
                value=""
            )
            
            # Generate button
            generate_btn = gr.Button("🎬 Generate Video", variant="primary", size="lg")
            
            # Results display
            # Receives the (video path, info text) pair returned by generate_video.
            with gr.Column():
                output_video = gr.Video(
                    label="📹 Generated Video",
                    autoplay=True
                )
                output_info = gr.Textbox(
                    label="Information",
                    lines=8,
                    interactive=False
                )
    
    # Usage instructions
    # Static help text, collapsed by default.
    with gr.Accordion("📖 How to Use", open=False):
        gr.Markdown("""
        ### Installation
        
        1. **Install required packages**:
        ```bash
        pip install gradio replicate pillow requests
        ```
        
        2. **For watermark support (optional)**:
        ```bash
        pip install opencv-python
        ```
        
        3. **Set environment variable** (optional):
        ```bash
        export RAPI_TOKEN="your-replicate-api-token"
        ```
        
        4. **Run**:
        ```bash
        python app.py
        ```
        
        ### Features
        
        - **Text to Video**: Generate video from text description only
        - **Image to Video**: Transform uploaded image into animated video
        - **Aspect Ratios**: Choose ratios optimized for various social media platforms
        - **Seed Value**: Use same seed to reproduce identical results
        - **Watermark**: Automatically adds "ginigen.com" watermark (requires opencv-python)
        
        ### Prompt Writing Tips
        
        - Use specific and detailed descriptions
        - Specify camera movements (e.g., zoom in, pan left, tracking shot)
        - Describe lighting and atmosphere (e.g., golden hour, dramatic lighting)
        - Indicate movement speed (e.g., slowly, rapidly, gently)
        
        ### Troubleshooting
        
        - **Timeout errors**: The model might be cold starting. Wait 1-2 minutes and try again.
        - **Model booting**: First requests after inactivity may take longer as the model boots up.
        - **Extended wait times**: Complex prompts or server load may cause longer generation times.
        - **Watermark not showing**: Install opencv-python for watermark support.
        """)
    
    # Examples
    # Each row lists values in the same order as `inputs`:
    # mode, prompt, image, aspect ratio, seed. All examples are text-only,
    # so the image slot is None.
    gr.Examples(
        examples=[
            ["Text to Video", "A serene lake at sunrise with mist rolling over the water. Camera slowly pans across the landscape as birds fly overhead.", None, "16:9", 42],
            ["Text to Video", "Urban street scene at night with neon lights reflecting on wet pavement. People walking with umbrellas, camera tracking forward.", None, "9:16", 123],
            ["Text to Video", "Close-up of a flower blooming in time-lapse, soft natural lighting, shallow depth of field.", None, "1:1", 789],
        ],
        inputs=[mode, prompt, image_input, aspect_ratio, seed],
        label="Example Prompts"
    )
    
    # Event handlers
    # Two handlers are attached to the mode switch. This one resets the prompt
    # box (placeholder and value) for the newly selected mode.
    mode.change(
        fn=update_prompt_placeholder,
        inputs=[mode],
        outputs=[prompt]
    )
    
    # The second mode handler shows or hides the image uploader.
    mode.change(
        fn=update_image_input,
        inputs=[mode],
        outputs=[image_input]
    )
    
    # Keep the ratio description in sync with the dropdown selection
    aspect_ratio.change(
        fn=lambda x: f"Selected ratio: {ASPECT_RATIOS[x]}",
        inputs=[aspect_ratio],
        outputs=[ratio_info]
    )
    
    # Run the generation; the input order must match generate_video's
    # positional parameters (progress is left at its default).
    generate_btn.click(
        fn=generate_video,
        inputs=[mode, prompt, image_input, aspect_ratio, seed, api_key_input],
        outputs=[output_video, output_info]
    )

# Run app
# Only start the server when executed as a script, not when imported.
if __name__ == "__main__":
    launch_options = {
        "server_name": "0.0.0.0",  # listen on all network interfaces
        "server_port": 7860,
        "share": False,
        "inbrowser": True,
    }
    app.launch(**launch_options)