Spaces:

testdeep123
/

video

Build error

App Files Files Community

testdeep123 commited on Apr 11

Commit

59b7f47

verified ·

1 Parent(s): c760fa6

Update app.py

Browse files

Files changed (1) hide show

app.py +651 -862

app.py CHANGED Viewed

@@ -1,1085 +1,874 @@
 import os
-import shutil # Added for directory cleanup
-import requests
-import io
-import time
-import re
 import random
-import tempfile # Added for use in create_clip
-import math
 import cv2
 import numpy as np
-import soundfile as sf
-import torch
-import gradio as gr
-import pysrt
 from bs4 import BeautifulSoup
 from urllib.parse import quote
-from PIL import Image, ImageDraw, ImageFont
 from gtts import gTTS
-from pydub import AudioSegment
-from pydub.generators import Sine
-# Import moviepy components correctly
-try:
-    from moviepy.editor import (
-        VideoFileClip, AudioFileClip, ImageClip, concatenate_videoclips,
-        CompositeVideoClip, TextClip, CompositeAudioClip
-    )
-    import moviepy.video.fx.all as vfx
-    import moviepy.config as mpy_config
-    # Set ImageMagick binary (adjust path if necessary for your environment)
-    # Check if ImageMagick is available, otherwise TextClip might fail
-    try:
-        # Attempt to find ImageMagick automatically or use a common path
-        # If running locally, ensure ImageMagick is installed and in your PATH
-        # If on Hugging Face Spaces, add 'imagemagick' to a packages.txt file
-        mpy_config.change_settings({"IMAGEMAGICK_BINARY": "/usr/bin/convert"}) # Common Linux path
-        print("ImageMagick path set.")
-        # You might need to verify this path works in your specific deployment environment
-    except Exception as e:
-        print(f"Warning: Could not configure ImageMagick path. TextClip might fail. Error: {e}")
-        # Consider adding a fallback or disabling text if ImageMagick is essential and not found
-except ImportError:
-    print("Error: moviepy library not found. Please install it using 'pip install moviepy'.")
-    # Optionally, exit or raise a more specific error if moviepy is critical
-    exit() # Exit if moviepy is absolutely required
-# Import Kokoro (ensure it's installed)
-try:
-    from kokoro import KPipeline
-    # Initialize Kokoro TTS pipeline
-    # Using 'en' as a placeholder, adjust 'a' if it was intentional and valid for Kokoro
-    pipeline = KPipeline(lang_code='en')
-    print("Kokoro Pipeline Initialized.")
-except ImportError:
-    print("Warning: Kokoro library not found. TTS generation will rely solely on gTTS.")
-    pipeline = None
-except Exception as e:
-    print(f"Warning: Failed to initialize Kokoro Pipeline. TTS generation will rely solely on gTTS. Error: {e}")
-    pipeline = None
-# Global Configuration
-# --- IMPORTANT: Replace placeholders with your actual keys or use environment variables ---
-PEXELS_API_KEY = os.getenv('PEXELS_API_KEY', 'YOUR_PEXELS_API_KEY_HERE') # Use environment variable or replace
-OPENROUTER_API_KEY = os.getenv('OPENROUTER_API_KEY', 'YOUR_OPENROUTER_API_KEY_HERE') # Use environment variable or replace
-# --- ---
-if PEXELS_API_KEY == 'YOUR_PEXELS_API_KEY_HERE' or OPENROUTER_API_KEY == 'YOUR_OPENROUTER_API_KEY_HERE':
-    print("\n*** WARNING: API keys are not set. Please set PEXELS_API_KEY and OPENROUTER_API_KEY environment variables or replace the placeholders in the script. ***\n")
-OPENROUTER_MODEL = "mistralai/mistral-small-3.1-24b-instruct:free" # Or choose another model
-TEMP_FOLDER = "temp_video_processing"
 OUTPUT_VIDEO_FILENAME = "final_video.mp4"
 USER_AGENT = "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
-BACKGROUND_MUSIC_PATH = "background_music.mp3" # Ensure this file exists
-# --- Global variables to be set by Gradio input ---
-TARGET_RESOLUTION = (1920, 1080) # Default, will be updated
-CAPTION_COLOR = "white" # Default, will be updated
-# Helper Functions
 def generate_script(user_input):
-    """Generates a script using the OpenRouter API based on user input."""
-    if not OPENROUTER_API_KEY or OPENROUTER_API_KEY == 'YOUR_OPENROUTER_API_KEY_HERE':
-        print("Error: OpenRouter API Key not configured.")
-        return None
     headers = {
         'Authorization': f'Bearer {OPENROUTER_API_KEY}',
-        'HTTP-Referer': 'https://your-app-name.hf.space', # Optional: Replace with your app's URL if deployed
-        'X-Title': 'AI Documentary Maker' # Optional
     }
-    # Updated prompt based on original instructions
-    prompt = f"""Short Documentary Script Generator Instructions:
 If I say "use this," just output the script exactly as I gave it.
 If I only give topics, generate a script based on them.
-If I provide a full script, rewrite it without any changes.
-Make everything short, simple, humorous, funny, and act serious but humorous.
-Don't say anything off-topic.
-Always include a funny statement to subscribe based on the video topic at the end.
-Use normal conversational text like a normal person talking, avoid AI phrases, make statements humanized and normal conversational.
-Always talk negative views, don't really want any positive statements.
-The full script will be one video about one topic, so keep that in mind.
 Formatting Rules:
-Title in Square Brackets: Each section starts with a one-word title inside [ ] (max two words if necessary). This title will be used as a search term for Pexels footage.
-Casual & Funny Narration: Each section has 5-15 words of narration. Keep it natural, funny, and unpredictable (not robotic, poetic, or rhythmic).
-No Special Formatting: No bold, italics, or special characters. You are an assistant AI; your task is to create the script. You aren't a chatbot. So, don't write extra text.
-Generalized Search Terms: If a term is too specific, make it more general for Pexels search.
-Scene-Specific Writing: Each section describes only what should be shown in the video.
-Output Only the Script: No extra text, just the script.
 Example Output:
 [North Korea]
-Top 5 unknown facts about North Korea, maybe.
 [Invisibility]
-North Korea’s internet speed is so fast… it’s basically dial-up from 1998.
 [Leadership]
-Kim Jong-un once won an election with 100% votes… because who would vote against him?
 [Magic]
-North Korea discovered unicorns. They're delicious, apparently.
 [Warning]
-Subscribe now, or Kim Jong-un might send you a strongly worded letter.
 [Freedom]
-North Korean citizens enjoy unparalleled freedom... to agree with the government.
-Now here is the Topic/script: {user_input}
 """
     data = {
         'model': OPENROUTER_MODEL,
         'messages': [{'role': 'user', 'content': prompt}],
-        'temperature': 0.5, # Slightly increased for more variety in humor
-        'max_tokens': 1000 # Reduced slightly, adjust if scripts get cut off
     }
     try:
         response = requests.post(
             'https://openrouter.ai/api/v1/chat/completions',
             headers=headers,
             json=data,
-            timeout=45 # Increased timeout
         )
-        response.raise_for_status() # Raise an exception for bad status codes (4xx or 5xx)
-        response_data = response.json()
-        if 'choices' in response_data and len(response_data['choices']) > 0:
-            script_content = response_data['choices'][0]['message']['content']
-            # Basic cleaning: remove potential preamble/postamble if the model adds it
-            script_content = re.sub(r'^.*?\n*\[', '[', script_content, flags=re.DOTALL) # Remove text before first bracket
-            script_content = script_content.strip()
-            print(f"Generated Script:\n{script_content}") # Log the script
-            return script_content
         else:
-            print(f"Error: No choices found in OpenRouter response. Response: {response_data}")
             return None
-    except requests.exceptions.RequestException as e:
-        print(f"Error calling OpenRouter API: {e}")
-        return None
     except Exception as e:
-        print(f"An unexpected error occurred during script generation: {e}")
         return None
 def parse_script(script_text):
-    """Parses the generated script text into structured elements."""
-    if not script_text:
-        return []
     sections = {}
     current_title = None
     current_text = ""
     try:
         for line in script_text.splitlines():
             line = line.strip()
-            if not line: # Skip empty lines
-                continue
-            match = re.match(r'^\[([^\]]+)\](.*)', line)
-            if match:
-                # If a title was being processed, save it
-                if current_title is not None and current_text:
-                    sections[current_title] = current_text.strip()
-                current_title = match.group(1).strip()
-                current_text = match.group(2).strip()
-            elif current_title: # Append to the text of the current title
-                current_text += " " + line # Add space between lines
-        # Save the last section
-        if current_title is not None and current_text:
             sections[current_title] = current_text.strip()
         elements = []
-        if not sections:
-             print("Warning: Script parsing resulted in no sections.")
-             # Maybe try a simpler split if the regex fails?
-             lines = [l.strip() for l in script_text.splitlines() if l.strip()]
-             if len(lines) >= 2: # Basic fallback: assume first line is title, second is text
-                 print("Attempting basic fallback parsing.")
-                 title = lines[0].replace('[','').replace(']','')
-                 narration = ' '.join(lines[1:])
-                 sections[title] = narration
-        print(f"Parsed Sections: {sections}") # Log parsed sections
         for title, narration in sections.items():
             if not title or not narration:
-                print(f"Skipping empty section: Title='{title}', Narration='{narration}'")
                 continue
-            # Use title as media prompt
-            media_element = {"type": "media", "prompt": title, "effects": "random"} # Use random Ken Burns
-            # Calculate rough duration based on words
             words = narration.split()
-            # Duration: Base 2s + 0.4s per word, capped at ~10s unless very long
-            duration = min(10.0, max(3.0, 2.0 + len(words) * 0.4))
-            tts_element = {"type": "tts", "text": narration, "voice": "en", "duration": duration} # Duration is approximate here
             elements.append(media_element)
             elements.append(tts_element)
-        if not elements:
-             print("Error: No elements created after parsing.")
         return elements
     except Exception as e:
-        print(f"Error parsing script: {e}\nScript content was:\n{script_text}")
         return []
-def search_pexels(query, api_key, media_type="videos"):
-    """Searches Pexels for videos or images."""
-    if not api_key or api_key == 'YOUR_PEXELS_API_KEY_HERE':
-        print("Error: Pexels API Key not configured.")
         return None
-    headers = {'Authorization': api_key}
-    base_url = f"https://api.pexels.com/{media_type}/search"
-    results = []
-    # Search multiple pages for better results
-    for page in range(1, 4): # Check first 3 pages
         try:
-            params = {"query": query, "per_page": 15, "page": page}
-            if media_type == "videos":
-                params["orientation"] = "landscape" if TARGET_RESOLUTION[0] > TARGET_RESOLUTION[1] else "portrait"
-            else: # images
-                 params["orientation"] = "landscape" if TARGET_RESOLUTION[0] > TARGET_RESOLUTION[1] else "portrait"
-            response = requests.get(base_url, headers=headers, params=params, timeout=15)
-            response.raise_for_status()
-            data = response.json()
-            if media_type == "videos":
-                media_items = data.get("videos", [])
-                for item in media_items:
-                    video_files = item.get("video_files", [])
-                    # Prioritize HD or FHD based on target resolution, fallback to highest available
-                    target_quality = "hd" # 1280x720 or 1920x1080
-                    if TARGET_RESOLUTION[0] >= 1920 or TARGET_RESOLUTION[1] >= 1920:
-                         target_quality = "fhd" # Often not available, but check anyway
-                    link = None
-                    for file in video_files:
-                        # Pexels uses 'hd' for 1920x1080 too sometimes
-                        if file.get("quality") == target_quality or file.get("quality") == "hd":
-                            link = file.get("link")
-                            break
-                    if not link and video_files: # Fallback to the first link if specific quality not found
-                         link = video_files[0].get("link")
-                    if link:
-                        results.append(link)
-            else: # images
-                media_items = data.get("photos", [])
-                for item in media_items:
-                    # Get original size, resizing happens later
-                    link = item.get("src", {}).get("original")
-                    if link:
-                        results.append(link)
         except requests.exceptions.RequestException as e:
-            print(f"Warning: Pexels API request failed for '{query}' (page {page}, {media_type}): {e}")
-            # Don't stop searching on a single page failure
-            continue
-        except Exception as e:
-            print(f"Warning: Unexpected error during Pexels search for '{query}': {e}")
-            continue
-    if results:
-        print(f"Found {len(results)} Pexels {media_type} for '{query}'. Choosing one randomly.")
-        return random.choice(results)
-    else:
-        print(f"Warning: No Pexels {media_type} found for query: '{query}'")
-        return None
 def search_google_images(query):
-    """Searches Google Images (use cautiously, scraping can be fragile)."""
-    print(f"Attempting Google Image search for: '{query}' (Use with caution)")
     try:
-        search_url = f"https://www.google.com/search?q={quote(query)}&tbm=isch&safe=active" # Added safe search
         headers = {"User-Agent": USER_AGENT}
-        response = requests.get(search_url, headers=headers, timeout=15)
-        response.raise_for_status()
         soup = BeautifulSoup(response.text, "html.parser")
-        image_urls = []
-        # Google changes its structure often, this might need updates
-        # Look for image data embedded in script tags or specific img tags
-        # This is a common pattern, but highly unstable
         img_tags = soup.find_all("img")
         for img in img_tags:
-            src = img.get("src") or img.get("data-src")
-            if src and src.startswith("http") and "gstatic" not in src and "googlelogo" not in src:
-                 # Basic check for valid image extensions or base64
-                 if re.search(r'\.(jpg|jpeg|png|webp)$', src, re.IGNORECASE) or src.startswith('data:image'):
-                     image_urls.append(src)
-        # Limit the number of results to avoid processing too many
-        image_urls = image_urls[:10] # Consider first 10 potential images
         if image_urls:
-            print(f"Found {len(image_urls)} potential Google Images for '{query}'. Choosing one.")
-            return random.choice(image_urls)
         else:
-            print(f"Warning: No suitable Google Images found for query: '{query}'")
             return None
-    except requests.exceptions.RequestException as e:
-        print(f"Warning: Google Image search failed for '{query}': {e}")
-        return None
     except Exception as e:
-        print(f"Warning: Error parsing Google Image search results for '{query}': {e}")
         return None
-def download_media(media_url, filename):
-    """Downloads media (image or video) from a URL."""
     try:
-        headers = {"User-Agent": USER_AGENT} # Use User-Agent for downloads too
-        response = requests.get(media_url, headers=headers, stream=True, timeout=30) # Increased timeout for large files
         response.raise_for_status()
         with open(filename, 'wb') as f:
             for chunk in response.iter_content(chunk_size=8192):
                 f.write(chunk)
-        print(f"Successfully downloaded media to {filename}")
-        # Verify image integrity and convert if necessary
-        if filename.lower().endswith(('.png', '.jpg', '.jpeg', '.webp')):
-            try:
-                img = Image.open(filename)
-                img.verify() # Verify that it is, in fact an image
-                # Re-open image for conversion check
-                img = Image.open(filename)
-                if img.mode != 'RGB':
-                    print(f"Converting image {filename} to RGB.")
-                    img = img.convert('RGB')
-                    img.save(filename, "JPEG") # Save as JPEG for compatibility
-                img.close()
-            except (IOError, SyntaxError, Image.UnidentifiedImageError) as img_e:
-                print(f"Warning: Downloaded file {filename} is not a valid image or is corrupted: {img_e}. Removing.")
                 os.remove(filename)
-                return None
-        # Basic video check (can be expanded)
-        elif filename.lower().endswith(('.mp4', '.mov', '.avi')):
-             if os.path.getsize(filename) < 1024: # Check if file is too small (likely error)
-                  print(f"Warning: Downloaded video file {filename} is suspiciously small. Removing.")
-                  os.remove(filename)
-                  return None
-        return filename
-    except requests.exceptions.RequestException as e:
-        print(f"Error downloading media from {media_url}: {e}")
         if os.path.exists(filename):
             os.remove(filename)
         return None
     except Exception as e:
-        print(f"An unexpected error occurred during media download: {e}")
         if os.path.exists(filename):
             os.remove(filename)
         return None
-def generate_media(prompt, current_index=0, total_segments=1):
-    """Generates media (video or image) based on the prompt."""
     safe_prompt = re.sub(r'[^\w\s-]', '', prompt).strip().replace(' ', '_')
-    if not safe_prompt: safe_prompt = f"media_{current_index}" # Fallback filename
-    print(f"\n--- Generating Media for Prompt: '{prompt}' ---")
-    # --- Strategy ---
-    # 1. Try Pexels Video
-    # 2. Try Pexels Image
-    # 3. If prompt contains 'news' or similar, try Google Image as fallback
-    # 4. Use generic Pexels image as last resort
-    # 1. Try Pexels Video
-    video_url = search_pexels(prompt, PEXELS_API_KEY, media_type="videos")
-    if video_url:
         video_file = os.path.join(TEMP_FOLDER, f"{safe_prompt}_video.mp4")
-        if download_media(video_url, video_file):
-            print(f"Using Pexels video for '{prompt}'")
-            return {"path": video_file, "asset_type": "video"}
         else:
-            print(f"Failed to download Pexels video for '{prompt}'.")
-    # 2. Try Pexels Image
-    image_url = search_pexels(prompt, PEXELS_API_KEY, media_type="photos")
     if image_url:
-        image_file = os.path.join(TEMP_FOLDER, f"{safe_prompt}_image.jpg")
-        if download_media(image_url, image_file):
-            print(f"Using Pexels image for '{prompt}'")
-            return {"path": image_file, "asset_type": "image"}
         else:
-            print(f"Failed to download Pexels image for '{prompt}'.")
-    # 3. Try Google Image (especially for specific/newsy terms)
-    if "news" in prompt.lower() or "breaking" in prompt.lower() or len(prompt.split()) > 4: # Heuristic for specific terms
-        google_image_url = search_google_images(prompt)
-        if google_image_url:
-            google_image_file = os.path.join(TEMP_FOLDER, f"{safe_prompt}_google_image.jpg")
-            if download_media(google_image_url, google_image_file):
-                print(f"Using Google image for '{prompt}' as fallback.")
-                return {"path": google_image_file, "asset_type": "image"}
-            else:
-                print(f"Failed to download Google image for '{prompt}'.")
-    # 4. Fallback to generic Pexels images
-    print(f"Could not find specific media for '{prompt}'. Using generic fallback.")
-    fallback_terms = ["abstract", "technology", "texture", "nature", "cityscape"]
-    random.shuffle(fallback_terms) # Try different fallbacks
     for term in fallback_terms:
-        fallback_url = search_pexels(term, PEXELS_API_KEY, media_type="photos")
         if fallback_url:
-            fallback_file = os.path.join(TEMP_FOLDER, f"fallback_{term}_{current_index}.jpg")
-            if download_media(fallback_url, fallback_file):
-                print(f"Using fallback Pexels image ('{term}')")
-                return {"path": fallback_file, "asset_type": "image"}
             else:
-                 print(f"Failed to download fallback Pexels image ('{term}')")
-    print(f"Error: Failed to generate any media for prompt: '{prompt}'")
-    return None # Failed to get any media
-def generate_tts(text, voice="en"):
-    """Generates Text-to-Speech audio using Kokoro or gTTS."""
-    safe_text = re.sub(r'[^\w\s-]', '', text[:15]).strip().replace(' ', '_')
-    if not safe_text: safe_text = f"tts_{random.randint(1000, 9999)}"
-    file_path = os.path.join(TEMP_FOLDER, f"{safe_text}.wav")
-    # Attempt Kokoro first if available
-    if pipeline:
-        try:
-            print(f"Generating TTS with Kokoro for: '{text[:30]}...'")
-            # Kokoro specific voice if needed, 'en' might map internally or use a default
-            # The original code used 'af_heart' for 'en', let's try that logic
-            kokoro_voice = 'af_heart' if voice == 'en' else voice # Adjust if Kokoro has different voice codes
-            generator = pipeline(text, voice=kokoro_voice, speed=0.95, split_pattern=r'\n+|[.!?]+') # Adjust speed/split
-            audio_segments = [audio for _, _, audio in generator]
-            if not audio_segments:
-                 raise ValueError("Kokoro returned no audio segments.")
-            # Ensure segments are numpy arrays before concatenating
-            valid_segments = [seg for seg in audio_segments if isinstance(seg, np.ndarray) and seg.size > 0]
-            if not valid_segments:
-                 raise ValueError("Kokoro returned empty or invalid audio segments.")
-            full_audio = np.concatenate(valid_segments) if len(valid_segments) > 0 else valid_segments[0]
-            # Ensure audio is float32 for soundfile
-            if full_audio.dtype != np.float32:
-                full_audio = full_audio.astype(np.float32)
-                # Normalize if needed (Kokoro might output integers)
-                max_val = np.max(np.abs(full_audio))
-                if max_val > 1.0:
-                    full_audio /= max_val
-            sf.write(file_path, full_audio, 24000) # Kokoro typically outputs at 24kHz
-            print(f"Kokoro TTS generated successfully: {file_path}")
-            return file_path
-        except Exception as e:
-            print(f"Warning: Kokoro TTS failed: {e}. Falling back to gTTS.")
-            # Fall through to gTTS
-    # Fallback to gTTS
     try:
-        print(f"Generating TTS with gTTS for: '{text[:30]}...'")
-        tts = gTTS(text=text, lang=voice, slow=False) # Use voice as language code for gTTS
-        # Save as mp3 first, then convert
-        mp3_path = os.path.join(TEMP_FOLDER, f"tts_{safe_text}.mp3")
-        tts.save(mp3_path)
-        audio = AudioSegment.from_mp3(mp3_path)
-        # Export as WAV for consistency with moviepy
-        audio.export(file_path, format="wav")
-        os.remove(mp3_path) # Clean up temporary mp3
-        print(f"gTTS TTS generated successfully: {file_path}")
         return file_path
     except Exception as e:
-        print(f"Error: gTTS also failed: {e}. Generating silence.")
-        # Final fallback: generate silence
         try:
-            # Estimate duration based on text length (similar to parsing logic)
-            words = text.split()
-            duration_seconds = min(10.0, max(3.0, 2.0 + len(words) * 0.4))
-            samplerate = 24000 # Match Kokoro's typical rate
-            num_samples = int(duration_seconds * samplerate)
-            silence = np.zeros(num_samples, dtype=np.float32)
-            sf.write(file_path, silence, samplerate)
-            print(f"Generated silence fallback: {file_path} ({duration_seconds:.1f}s)")
             return file_path
-        except Exception as silence_e:
-             print(f"Error: Failed even to generate silence: {silence_e}")
-             return None # Complete failure
-def apply_kenburns_effect(clip, target_resolution, effect_type="random"):
-    """Applies a Ken Burns effect (zoom/pan) to an ImageClip."""
     target_w, target_h = target_resolution
-    # Ensure clip has dimensions (might be needed if ImageClip wasn't fully initialized)
-    if not hasattr(clip, 'w') or not hasattr(clip, 'h') or clip.w == 0 or clip.h == 0:
-         print("Warning: Clip dimensions not found for Ken Burns effect. Using target resolution.")
-         # Attempt to get frame to determine size, or default
-         try:
-              frame = clip.get_frame(0)
-              clip.w, clip.h = frame.shape[1], frame.shape[0]
-         except:
-              clip.w, clip.h = target_w, target_h # Fallback
-    # Resize image to cover target area while maintaining aspect ratio
     clip_aspect = clip.w / clip.h
     target_aspect = target_w / target_h
-    if clip_aspect > target_aspect: # Image is wider than target
         new_height = target_h
         new_width = int(new_height * clip_aspect)
-    else: # Image is taller than target
         new_width = target_w
         new_height = int(new_width / clip_aspect)
-    # Resize slightly larger than needed for the effect
-    base_scale = 1.20 # Zoom factor range
-    zoom_width = int(new_width * base_scale)
-    zoom_height = int(new_height * base_scale)
-    # Use PIL for initial resize - often better quality for large changes
-    try:
-        pil_img = Image.fromarray(clip.get_frame(0)) # Get frame as PIL image
-        resized_pil = pil_img.resize((zoom_width, zoom_height), Image.Resampling.LANCZOS)
-        resized_clip = ImageClip(np.array(resized_pil)).set_duration(clip.duration)
-        clip = resized_clip # Use the better resized clip
-        clip.w, clip.h = zoom_width, zoom_height # Update dimensions
-    except Exception as pil_e:
-        print(f"Warning: PIL resize failed ({pil_e}). Using moviepy resize.")
-        clip = clip.resize(newsize=(zoom_width, zoom_height))
-    # Calculate max offsets for panning
-    max_offset_x = max(0, clip.w - target_w)
-    max_offset_y = max(0, clip.h - target_h)
-    # Define effect types
-    available_effects = ["zoom-in", "zoom-out", "pan-left", "pan-right", "pan-up", "pan-down", "slow-zoom"]
-    if effect_type == "random":
-        effect_type = random.choice(available_effects)
-    print(f"Applying Ken Burns effect: {effect_type}")
-    # Determine start/end zoom and center positions based on effect
-    start_zoom, end_zoom = 1.0, 1.0
-    start_center_x, start_center_y = clip.w / 2, clip.h / 2
-    end_center_x, end_center_y = clip.w / 2, clip.h / 2
     if effect_type == "zoom-in":
-        start_zoom = 1.0
-        end_zoom = 1 / base_scale # Zoom factor applied to crop size
     elif effect_type == "zoom-out":
-        start_zoom = 1 / base_scale
-        end_zoom = 1.0
-    elif effect_type == "slow-zoom":
-         start_zoom = 1.0
-         end_zoom = 1 / 1.05 # Very subtle zoom in
     elif effect_type == "pan-left":
-        start_center_x = target_w / 2
-        end_center_x = clip.w - target_w / 2
-        start_center_y = end_center_y = clip.h / 2 # Center vertically
     elif effect_type == "pan-right":
-        start_center_x = clip.w - target_w / 2
-        end_center_x = target_w / 2
-        start_center_y = end_center_y = clip.h / 2
-    elif effect_type == "pan-up":
-        start_center_y = target_h / 2
-        end_center_y = clip.h - target_h / 2
-        start_center_x = end_center_x = clip.w / 2 # Center horizontally
-    elif effect_type == "pan-down":
-        start_center_y = clip.h - target_h / 2
-        end_center_y = target_h / 2
-        start_center_x = end_center_x = clip.w / 2
-    # Add more effects like diagonal pans if desired
     def transform_frame(get_frame, t):
-        frame = get_frame(t) # Get the frame from the (potentially PIL-resized) clip
-        # Smooth interpolation (ease-in, ease-out)
-        ratio = 0.5 - 0.5 * math.cos(math.pi * t / clip.duration) if clip.duration > 0 else 0
         current_zoom = start_zoom + (end_zoom - start_zoom) * ratio
         crop_w = int(target_w / current_zoom)
         crop_h = int(target_h / current_zoom)
-        # Ensure crop dimensions are not larger than the frame itself
-        crop_w = min(crop_w, clip.w)
-        crop_h = min(crop_h, clip.h)
-        current_center_x = start_center_x + (end_center_x - start_center_x) * ratio
-        current_center_y = start_center_y + (end_center_y - start_center_y) * ratio
-        # Clamp center position to avoid cropping outside the image boundaries
         min_center_x = crop_w / 2
-        max_center_x = clip.w - crop_w / 2
         min_center_y = crop_h / 2
-        max_center_y = clip.h - crop_h / 2
         current_center_x = max(min_center_x, min(current_center_x, max_center_x))
         current_center_y = max(min_center_y, min(current_center_y, max_center_y))
-        # Perform the crop using cv2.getRectSubPix for subpixel accuracy
-        # Ensure frame is contiguous array for cv2
-        if not frame.flags['C_CONTIGUOUS']:
-             frame = np.ascontiguousarray(frame)
-        try:
-            cropped_frame = cv2.getRectSubPix(frame, (crop_w, crop_h), (current_center_x, current_center_y))
-            # Resize the cropped area to the final target resolution
-            # Using LANCZOS4 for potentially better quality resizing
-            final_frame = cv2.resize(cropped_frame, (target_w, target_h), interpolation=cv2.INTER_LANCZOS4)
-            return final_frame
-        except cv2.error as cv2_err:
-             print(f"Error during cv2 operation in Ken Burns: {cv2_err}")
-             print(f"Frame shape: {frame.shape}, Crop W/H: {crop_w}/{crop_h}, Center X/Y: {current_center_x}/{current_center_y}")
-             # Fallback: return uncropped frame resized? Or black frame?
-             return cv2.resize(frame, (target_w, target_h), interpolation=cv2.INTER_LINEAR) # Fallback resize
-    # Apply the transformation function to the clip
-    return clip.fl(transform_frame, apply_to=['mask']) # Apply to mask if it exists
 def resize_to_fill(clip, target_resolution):
-    """Resizes a video clip to fill the target resolution, cropping if necessary."""
     target_w, target_h = target_resolution
-    clip_w, clip_h = clip.w, clip.h
-    if clip_w == 0 or clip_h == 0:
-        print("Warning: Clip has zero dimensions before resize_to_fill. Cannot resize.")
-        # Return a black clip of the target size?
-        return ColorClip(size=target_resolution, color=(0,0,0), duration=clip.duration)
-    clip_aspect = clip_w / clip_h
     target_aspect = target_w / target_h
-    if math.isclose(clip_aspect, target_aspect, rel_tol=1e-3):
-        # Aspect ratios are close enough, just resize
-        print(f"Resizing video clip {clip.filename} to {target_resolution} (aspect match).")
-        return clip.resize(newsize=target_resolution)
-    elif clip_aspect > target_aspect:
-        # Clip is wider than target aspect ratio, resize to target height and crop width
-        print(f"Resizing video clip {clip.filename} to height {target_h} and cropping width.")
         clip = clip.resize(height=target_h)
-        # Calculate amount to crop from each side
         crop_amount = (clip.w - target_w) / 2
-        if crop_amount < 0: # Avoid negative crop
-             print("Warning: Negative crop amount calculated in resize_to_fill (width). Resizing only.")
-             return clip.resize(newsize=target_resolution)
-        return clip.crop(x1=crop_amount, width=target_w)
     else:
-        # Clip is taller than target aspect ratio, resize to target width and crop height
-        print(f"Resizing video clip {clip.filename} to width {target_w} and cropping height.")
         clip = clip.resize(width=target_w)
-        # Calculate amount to crop from top/bottom
         crop_amount = (clip.h - target_h) / 2
-        if crop_amount < 0: # Avoid negative crop
-             print("Warning: Negative crop amount calculated in resize_to_fill (height). Resizing only.")
-             return clip.resize(newsize=target_resolution)
-        return clip.crop(y1=crop_amount, height=target_h)
-def add_background_music(final_video, bg_music_path=BACKGROUND_MUSIC_PATH, bg_music_volume=0.08):
-    """Adds background music to the final video."""
-    if not os.path.exists(bg_music_path):
-        print(f"Warning: Background music file not found at {bg_music_path}. Skipping.")
-        return final_video
     try:
-        print("Adding background music...")
-        bg_music = AudioFileClip(bg_music_path)
-        if final_video.duration is None or final_video.duration <= 0:
-             print("Warning: Final video has no duration. Cannot add background music.")
-             return final_video
-        if bg_music.duration is None or bg_music.duration <= 0:
-             print("Warning: Background music has no duration. Skipping.")
-             return final_video
-        # Loop or trim background music to match video duration
-        if bg_music.duration < final_video.duration:
-            loops_needed = math.ceil(final_video.duration / bg_music.duration)
-            print(f"Looping background music {loops_needed} times.")
-            bg_music = concatenate_audioclips([bg_music] * loops_needed)
-        # Trim to exact duration
-        bg_music = bg_music.subclip(0, final_video.duration)
-        # Adjust volume
-        bg_music = bg_music.volumex(bg_music_volume)
-        # Combine with existing audio (if any)
-        video_audio = final_video.audio
-        if video_audio:
-            # Normalize main audio slightly? Optional.
-            # video_audio = video_audio.volumex(1.0) # Keep original volume
-            print("Mixing existing audio with background music.")
             mixed_audio = CompositeAudioClip([video_audio, bg_music])
         else:
-            print("No existing audio found. Using only background music.")
-            mixed_audio = bg_music
-        # Set the new audio track
-        final_video = final_video.set_audio(mixed_audio)
-        print("Background music added successfully.")
         return final_video
     except Exception as e:
         print(f"Error adding background music: {e}")
-        # Return the original video without crashing
         return final_video
 def create_clip(media_path, asset_type, tts_path, duration=None, effects=None, narration_text=None, segment_index=0):
-    """Creates a single video clip segment with media, audio, and optional captions."""
-    print(f"\n--- Creating Clip Segment {segment_index} ---")
-    print(f"Media: {media_path} ({asset_type})")
-    print(f"TTS: {tts_path}")
-    print(f"Narration: '{narration_text[:50]}...'")
     try:
-        # Validate inputs
-        if not media_path or not os.path.exists(media_path):
-            print(f"Error: Media path not found or invalid: {media_path}")
-            return None
-        if not tts_path or not os.path.exists(tts_path):
-            print(f"Error: TTS path not found or invalid: {tts_path}")
-            # Attempt to use media without audio? Or fail? Let's fail for now.
             return None
-        # Load audio first to determine duration
-        audio_clip = AudioFileClip(tts_path)
-        # Add slight fade out to avoid abrupt cuts
-        audio_clip = audio_clip.audio_fadeout(0.2)
-        target_duration = audio_clip.duration
-        if target_duration is None or target_duration <= 0.1: # Check for valid duration
-             print(f"Warning: Audio clip {tts_path} has invalid duration ({target_duration}). Estimating 3 seconds.")
-             target_duration = 3.0 # Fallback duration
-             # Recreate audio clip with fixed duration if possible? Or just use the duration.
-             audio_clip = audio_clip.set_duration(target_duration)
-        print(f"Audio Duration: {target_duration:.2f}s")
-        # --- Create Video/Image Clip ---
-        clip = None
         if asset_type == "video":
-            try:
-                clip = VideoFileClip(media_path, target_resolution=TARGET_RESOLUTION[::-1]) # Provide target res hint
-                # Ensure video has audio track removed initially if we overlay TTS fully
-                clip = clip.without_audio()
-                # Resize/Crop to fill target resolution
-                clip = resize_to_fill(clip, TARGET_RESOLUTION)
-                # Loop or cut video to match audio duration
-                if clip.duration < target_duration:
-                    print(f"Looping video (duration {clip.duration:.2f}s) to match audio.")
-                    clip = clip.loop(duration=target_duration)
-                else:
-                    # Start from a random point if video is longer? Or just take the start?
-                    start_time = 0
-                    # Optional: random start time if video is much longer
-                    # if clip.duration > target_duration + 2:
-                    #    start_time = random.uniform(0, clip.duration - target_duration)
-                    print(f"Subclipping video from {start_time:.2f}s to {start_time + target_duration:.2f}s.")
-                    clip = clip.subclip(start_time, start_time + target_duration)
-                # Add fade in/out for smoother transitions
-                clip = clip.fadein(0.3).fadeout(0.3)
-            except Exception as video_e:
-                print(f"Error processing video file {media_path}: {video_e}")
-                # Fallback to a black screen?
-                clip = ColorClip(size=TARGET_RESOLUTION, color=(0,0,0), duration=target_duration)
         elif asset_type == "image":
-            try:
-                # Use tempfile for converted image if needed (handled in download now)
-                # Load image clip
-                clip = ImageClip(media_path).set_duration(target_duration)
-                # Apply Ken Burns effect
-                clip = apply_kenburns_effect(clip, TARGET_RESOLUTION, effect_type=effects or "random")
-                # Fades are good for images too
-                clip = clip.fadein(0.3).fadeout(0.3)
-            except Exception as img_e:
-                 print(f"Error processing image file {media_path}: {img_e}")
-                 # Fallback to a grey screen?
-                 clip = ColorClip(size=TARGET_RESOLUTION, color=(50,50,50), duration=target_duration)
         else:
-            print(f"Error: Unknown asset type '{asset_type}'")
-            return None # Unknown type
-        # Ensure clip has the correct duration after processing
-        clip = clip.set_duration(target_duration)
-        # --- Add Captions ---
-        subtitle_clips = []
         if narration_text and CAPTION_COLOR != "transparent":
-            print("Adding captions...")
             try:
-                # Simple word splitting for timing (can be improved with proper SRT/timing info)
                 words = narration_text.split()
-                words_per_chunk = 5 # Adjust number of words per caption line
-                chunks = [' '.join(words[i:i+words_per_chunk]) for i in range(0, len(words), words_per_chunk)]
-                if not chunks: chunks = [narration_text] # Handle empty or short text
-                chunk_duration = target_duration / len(chunks) if len(chunks) > 0 else target_duration
-                # Calculate font size based on resolution (heuristic)
-                font_size = int(TARGET_RESOLUTION[1] / 25) # Adjust divisor as needed
-                # Position captions towards the bottom
-                subtitle_y_position = int(TARGET_RESOLUTION[1] * 0.85) # Lower position
                 for i, chunk_text in enumerate(chunks):
                     start_time = i * chunk_duration
-                    # Ensure end time doesn't exceed clip duration
-                    end_time = min((i + 1) * chunk_duration, target_duration)
-                    # Avoid zero-duration captions
-                    if end_time <= start_time: end_time = start_time + 0.1
-                    # Create TextClip for the chunk
-                    # Ensure font is available in the environment (Arial is common, but might need install)
-                    # Added stroke for better visibility
                     txt_clip = TextClip(
                         chunk_text,
-                        fontsize=font_size,
-                        font='Arial-Bold', # Ensure this font is available or choose another like 'Liberation-Sans-Bold'
                         color=CAPTION_COLOR,
-                        bg_color='rgba(0, 0, 0, 0.5)', # Slightly darker background
-                        method='caption', # Wraps text
                         align='center',
-                        stroke_color='black', # Black stroke
-                        stroke_width=max(1, font_size // 20), # Stroke width relative to font size
-                        size=(TARGET_RESOLUTION[0] * 0.85, None) # Limit width
-                    ).set_start(start_time).set_duration(end_time - start_time).set_position(('center', subtitle_y_position))
                     subtitle_clips.append(txt_clip)
-                # Composite the main clip with subtitles
-                if subtitle_clips:
-                    clip = CompositeVideoClip([clip] + subtitle_clips, size=TARGET_RESOLUTION)
-                    print(f"Added {len(subtitle_clips)} caption segments.")
-            except Exception as caption_e:
-                # This often happens if ImageMagick or fonts are missing/misconfigured
-                print(f"ERROR: Failed to create captions: {caption_e}")
-                print("Check if ImageMagick is installed and configured, and if the font (e.g., Arial-Bold) is available.")
-                # Continue without captions if they fail
-        # Set the audio track
         clip = clip.set_audio(audio_clip)
-        print(f"Clip Segment {segment_index} created successfully.")
         return clip
     except Exception as e:
-        print(f"FATAL ERROR creating clip segment {segment_index}: {e}")
-        import traceback
-        traceback.print_exc() # Print detailed traceback for debugging
-        # Return a short, silent black clip to avoid crashing the concatenation
-        return ColorClip(size=TARGET_RESOLUTION, color=(0,0,0), duration=1.0).set_audio(None)
-# Main Gradio Function
-def generate_video(video_concept, resolution_choice, caption_option):
-    """The main function called by Gradio to generate the video."""
-    print("\n\n--- Starting Video Generation ---")
-    print(f"Concept: {video_concept}")
-    print(f"Resolution: {resolution_choice}")
-    print(f"Captions: {caption_option}")
-    global TARGET_RESOLUTION, CAPTION_COLOR
-    # Set global config based on input
-    if resolution_choice == "Short (9:16)":
-        TARGET_RESOLUTION = (1080, 1920)
-    else: # Default to Full HD
         TARGET_RESOLUTION = (1920, 1080)
-    CAPTION_COLOR = "white" if caption_option == "Yes" else "transparent" # Use "transparent" to disable
-    # --- Cleanup and Setup ---
-    if os.path.exists(TEMP_FOLDER):
-        print(f"Removing existing temp folder: {TEMP_FOLDER}")
-        shutil.rmtree(TEMP_FOLDER)
-    try:
-        os.makedirs(TEMP_FOLDER)
-        print(f"Created temp folder: {TEMP_FOLDER}")
-    except OSError as e:
-         print(f"Error creating temp folder {TEMP_FOLDER}: {e}")
-         return f"Error: Could not create temporary directory. Check permissions. {e}" # Return error message to Gradio
-    # --- Script Generation ---
-    print("Generating script...")
-    script = generate_script(video_concept)
-    if not script:
-        print("Error: Failed to generate script.")
-        shutil.rmtree(TEMP_FOLDER) # Clean up
-        return "Error: Failed to generate script from AI. Please try a different concept or check API keys." # Return error message
-    # --- Script Parsing ---
-    print("Parsing script...")
     elements = parse_script(script)
     if not elements:
-        print("Error: Failed to parse script into elements.")
-        shutil.rmtree(TEMP_FOLDER) # Clean up
-        return "Error: Failed to parse the generated script. The script might be malformed." # Return error message
-    # Pair media prompts with TTS elements
     paired_elements = []
-    if len(elements) >= 2:
-        for i in range(0, len(elements), 2):
-            if i + 1 < len(elements) and elements[i]['type'] == 'media' and elements[i+1]['type'] == 'tts':
-                paired_elements.append((elements[i], elements[i+1]))
-            else:
-                 print(f"Warning: Skipping mismatched elements at index {i}")
     if not paired_elements:
-        print("Error: No valid media/TTS pairs found after parsing.")
-        shutil.rmtree(TEMP_FOLDER) # Clean up
-        return "Error: Could not find valid [Title]/Narration pairs in the script." # Return error message
-    print(f"Found {len(paired_elements)} pairs of media prompts and narrations.")
-    # --- Clip Generation Loop ---
     clips = []
-    total_segments = len(paired_elements)
     for idx, (media_elem, tts_elem) in enumerate(paired_elements):
-        print(f"\nProcessing Segment {idx+1}/{total_segments}: Prompt='{media_elem['prompt']}'")
-        # 1. Generate Media (Video/Image)
-        media_asset = generate_media(media_elem['prompt'], current_index=idx, total_segments=total_segments)
-        if not media_asset or not media_asset.get('path'):
-            print(f"Warning: Failed to generate media for '{media_elem['prompt']}'. Skipping segment.")
-            # Option: Create a placeholder clip instead of skipping?
-            # clips.append(ColorClip(size=TARGET_RESOLUTION, color=(20,0,0), duration=3.0)) # Short red flash?
-            continue # Skip this segment
-        # 2. Generate TTS
         tts_path = generate_tts(tts_elem['text'], tts_elem['voice'])
         if not tts_path:
-            print(f"Warning: Failed to generate TTS for segment {idx}. Skipping segment.")
-            # Option: Create clip without audio? Requires adjusting create_clip
-            continue # Skip this segment
-        # 3. Create MoviePy Clip Segment
         clip = create_clip(
             media_path=media_asset['path'],
             asset_type=media_asset['asset_type'],
             tts_path=tts_path,
-            duration=tts_elem['duration'], # Duration hint (create_clip prioritizes actual audio length)
-            effects=media_elem.get('effects', 'random'),
             narration_text=tts_elem['text'],
             segment_index=idx
         )
         if clip:
             clips.append(clip)
         else:
-            print(f"Warning: Failed to create clip for segment {idx}. Skipping.")
-            # Maybe add a fallback black clip here too?
-    # --- Final Video Assembly ---
     if not clips:
-        print("Error: No clips were successfully created.")
-        shutil.rmtree(TEMP_FOLDER) # Clean up
-        return "Error: Failed to create any video segments. Check logs for media/TTS/clip creation errors." # Return error message
-    print(f"\nConcatenating {len(clips)} video clips...")
-    try:
-        # Concatenate all the generated clips
-        final_video = concatenate_videoclips(clips, method="compose") # 'compose' handles transparency if needed
-    except Exception as concat_e:
-        print(f"Error during video concatenation: {concat_e}")
         shutil.rmtree(TEMP_FOLDER)
-        return f"Error: Failed to combine video segments: {concat_e}"
-    # --- Add Background Music ---
-    final_video = add_background_music(final_video, bg_music_volume=0.08) # Adjust volume as needed
-    # --- Write Output File ---
-    print(f"Writing final video to {OUTPUT_VIDEO_FILENAME}...")
-    try:
-        # Write the final video file
-        # Use preset 'medium' or 'slow' for better quality/compression ratio if time allows
-        # Use 'libx264' for wide compatibility, 'aac' for audio codec
-        # threads=4 can speed up encoding on multi-core CPUs
-        final_video.write_videofile(
-            OUTPUT_VIDEO_FILENAME,
-            codec='libx264',
-            audio_codec='aac',
-            fps=24, # Standard frame rate
-            preset='medium', # 'veryfast', 'fast', 'medium', 'slow', 'veryslow'
-            threads=4, # Adjust based on CPU cores
-            logger='bar' # Show progress bar
-            )
-        print("Final video written successfully.")
-    except Exception as write_e:
-        print(f"Error writing final video file: {write_e}")
-        shutil.rmtree(TEMP_FOLDER)
-        return f"Error: Failed to write the final video file: {write_e}"
-    finally:
-        # --- Cleanup ---
-        # Close clips to release file handles (important on some OS)
-        for clip in clips:
-            clip.close()
-        if final_video:
-             final_video.close()
-        if 'bg_music' in locals() and bg_music: # Close bg music if loaded
-            bg_music.close()
-        if 'audio_clip' in locals() and audio_clip: # Close last audio clip
-            audio_clip.close()
-        print(f"Cleaning up temporary folder: {TEMP_FOLDER}")
-        shutil.rmtree(TEMP_FOLDER)
-    print("--- Video Generation Complete ---")
-    # Return the path to the generated video for Gradio
     return OUTPUT_VIDEO_FILENAME
-# --- Gradio Interface Definition ---
-with gr.Blocks(theme=gr.themes.Soft()) as demo:
-    gr.Markdown(
-        """
-        # 🎬 AI Documentary Video Generator 🎥
-        Enter a concept or topic, and the AI will generate a short, humorous documentary-style video.
-        Configure API keys (Pexels, OpenRouter) and ensure `background_music.mp3` exists before running.
-        """
-    )
-    with gr.Row():
-        with gr.Column(scale=2):
-            video_concept = gr.Textbox(
-                label="Video Concept / Topic / Script",
-                placeholder="e.g., 'The secret life of squirrels', 'Why cats secretly judge us', or paste a full script starting with [Title]...",
-                lines=4
-            )
-            with gr.Row():
-                 resolution = gr.Dropdown(
-                     ["Full HD (16:9)", "Short (9:16)"],
-                     label="Resolution",
-                     value="Full HD (16:9)"
-                 )
-                 caption_option = gr.Dropdown(
-                     ["Yes", "No"],
-                     label="Add Captions",
-                     value="Yes"
-                 )
-            generate_btn = gr.Button("✨ Generate Video ✨", variant="primary")
-        with gr.Column(scale=3):
-            output_video = gr.Video(label="Generated Video")
-            status_message = gr.Textbox(label="Status", interactive=False) # To show errors or progress
-    # Connect button click to the main function
-    generate_btn.click(
-        fn=generate_video,
-        inputs=[video_concept, resolution, caption_option],
-        outputs=[output_video] # Can also output to status_message if needed
-        # Example with status: outputs=[output_video, status_message]
-    )
-# Launch the Gradio app
-if __name__ == "__main__":
-    # Check for background music file on startup
-    if not os.path.exists(BACKGROUND_MUSIC_PATH):
-        print(f"\n*** WARNING: Background music file '{BACKGROUND_MUSIC_PATH}' not found. Background music will be skipped. ***\n")
-    demo.launch(debug=True) # debug=True provides more detailed logs

+# Install necessary packages
+!pip install transformers==4.49.0
+!pip install moviepy gTTS requests pydub pillow
+!pip cache purge
+!apt-get install imagemagick -y
+!pip install kokoro>=0.3.4 soundfile
+!apt-get-qq -y install espeak-ng > /dev/null 2>&1
+!pip install pysrt
+!pip install gradio  # Added Gradio installation
+# Import necessary libraries
+from kokoro import KPipeline
+from IPython.display import display, Audio
+import soundfile as sf
+import torch
+from IPython.display import display, Audio, HTML
+import soundfile as sf
 import os
+from moviepy.editor import VideoFileClip, AudioFileClip, ImageClip
+from PIL import Image
+import tempfile
 import random
 import cv2
+import math
+import os, requests, io, time, re, random
+from moviepy.editor import (
+    VideoFileClip, concatenate_videoclips, AudioFileClip, ImageClip,
+    CompositeVideoClip, TextClip
+)
+import moviepy.video.fx.all as vfx
+import moviepy.config as mpy_config
+from pydub import AudioSegment
+from pydub.generators import Sine
+from google.colab import files
+from PIL import Image, ImageDraw, ImageFont
 import numpy as np
 from bs4 import BeautifulSoup
+import base64
 from urllib.parse import quote
+import pysrt
 from gtts import gTTS
+import gradio as gr  # Import Gradio
+# Initialize Kokoro TTS pipeline (using American English)
+pipeline = KPipeline(lang_code='a')  # Use voice 'af_heart' for American English
+# Ensure ImageMagick binary is set
+mpy_config.change_settings({"IMAGEMAGICK_BINARY": "/usr/bin/convert"})
+# ---------------- Global Configuration ---------------- #
+PEXELS_API_KEY = 'BhJqbcdm9Vi90KqzXKAhnEHGsuFNv4irXuOjWtT761U49lRzo03qBGna'
+OPENROUTER_API_KEY = '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'
+OPENROUTER_MODEL = "mistralai/mistral-small-3.1-24b-instruct:free"
 OUTPUT_VIDEO_FILENAME = "final_video.mp4"
 USER_AGENT = "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
+# ---------------- Helper Functions ---------------- #
+# (Your existing helper functions remain unchanged: generate_script, parse_script,
+# search_pexels_videos, search_pexels_images, search_google_images, download_image,
+# download_video, generate_media, generate_tts, apply_kenburns_effect,
+# resize_to_fill, find_mp3_files, add_background_music, create_clip,
+# fix_imagemagick_policy)
+# Define these globally as they were in your original code but will be set per run
+TARGET_RESOLUTION = None
+CAPTION_COLOR = None
+TEMP_FOLDER = None
 def generate_script(user_input):
+    """Generate documentary script with proper OpenRouter handling."""
     headers = {
         'Authorization': f'Bearer {OPENROUTER_API_KEY}',
+        'HTTP-Referer': 'https://your-domain.com',
+        'X-Title': 'AI Documentary Maker'
     }
+    prompt = f"""Short Documentary Script GeneratorInstructions:
 If I say "use this," just output the script exactly as I gave it.
 If I only give topics, generate a script based on them.
+If I provide a full script, rewrite it without any changes. Make everything short simple and humarous funny and act as serious but humarous. And don't say anything off topic. Also alway say a funny statement to subscribe based on the video topic at the end. Use normal conversational text like a normal person talking and avoid AI phase make the statements humanize and normal conversational
+And always talk negative views don't really wants any positive statement and the full script will be one video about one topic so keep in mind
 Formatting Rules:
+Title in Square Brackets:
+Each section starts with a one-word title inside [ ] (max two words if necessary).
+This title will be used as a search term for Pexels footage.
+Casual & Funny Narration:
+Each section has 5-10 words of narration.
+Keep it natural, funny, and unpredictable (not robotic, poetic, or rhythmic).
+No Special Formatting:
+No bold, italics, or special characters. You are a assistant AI your task is to create script. You aren't a chatbot. So, don't write extra text
+Generalized Search Terms:
+If a term is too specific, make it more general for Pexels search.
+Scene-Specific Writing:
+Each section describes only what should be shown in the video.
+Output Only the Script, and also make it funny and humarous and helirous and also add to subscribe with a funny statement like subscribe now or .....
+No extra text, just the script.
 Example Output:
 [North Korea]
+Top 5 unknown facts about North Korea.
 [Invisibility]
+North Korea’s internet speed is so fast… it doesn’t exist.
 [Leadership]
+Kim Jong-un once won an election with 100% votes… against himself.
 [Magic]
+North Korea discovered time travel. That’s why their news is always from the past.
 [Warning]
+Subscribe now, or Kim Jong-un will send you a free one-way ticket… to North Korea.
 [Freedom]
+North Korean citizens can do anything… as long as it's government-approved.
+Now here is the Topic/scrip: {user_input}
 """
     data = {
         'model': OPENROUTER_MODEL,
         'messages': [{'role': 'user', 'content': prompt}],
+        'temperature': 0.4,
+        'max_tokens': 5000
     }
     try:
         response = requests.post(
             'https://openrouter.ai/api/v1/chat/completions',
             headers=headers,
             json=data,
+            timeout=30
         )
+        if response.status_code == 200:
+            response_data = response.json()
+            if 'choices' in response_data and len(response_data['choices']) > 0:
+                return response_data['choices'][0]['message']['content']
+            else:
+                print("Unexpected response format:", response_data)
+                return None
         else:
+            print(f"API Error {response.status_code}: {response.text}")
             return None
     except Exception as e:
+        print(f"Request failed: {str(e)}")
         return None
 def parse_script(script_text):
+    """
+    Parse the generated script into a list of elements.
+    For each section, create two elements:
+      - A 'media' element using the section title as the visual prompt.
+      - A 'tts' element with the narration text, voice info, and computed duration.
+    """
     sections = {}
     current_title = None
     current_text = ""
     try:
         for line in script_text.splitlines():
             line = line.strip()
+            if line.startswith("[") and "]" in line:
+                bracket_start = line.find("[")
+                bracket_end = line.find("]", bracket_start)
+                if bracket_start != -1 and bracket_end != -1:
+                    if current_title is not None:
+                        sections[current_title] = current_text.strip()
+                    current_title = line[bracket_start+1:bracket_end]
+                    current_text = line[bracket_end+1:].strip()
+            elif current_title:
+                current_text += line + " "
+        if current_title:
             sections[current_title] = current_text.strip()
         elements = []
         for title, narration in sections.items():
             if not title or not narration:
                 continue
+            media_element = {"type": "media", "prompt": title, "effects": "fade-in"}
             words = narration.split()
+            duration = max(3, len(words) * 0.5)
+            tts_element = {"type": "tts", "text": narration, "voice": "en", "duration": duration}
             elements.append(media_element)
             elements.append(tts_element)
         return elements
     except Exception as e:
+        print(f"Error parsing script: {e}")
         return []
+def search_pexels_videos(query, pexels_api_key):
+    """Search for a video on Pexels by query and return a random HD video."""
+    headers = {'Authorization': pexels_api_key}
+    base_url = "https://api.pexels.com/videos/search"
+    num_pages = 3
+    videos_per_page = 15
+    max_retries = 3
+    retry_delay = 1
+    search_query = query
+    all_videos = []
+    for page in range(1, num_pages + 1):
+        for attempt in range(max_retries):
+            try:
+                params = {"query": search_query, "per_page": videos_per_page, "page": page}
+                response = requests.get(base_url, headers=headers, params=params, timeout=10)
+                if response.status_code == 200:
+                    data = response.json()
+                    videos = data.get("videos", [])
+                    if not videos:
+                        print(f"No videos found on page {page}.")
+                        break
+                    for video in videos:
+                        video_files = video.get("video_files", [])
+                        for file in video_files:
+                            if file.get("quality") == "hd":
+                                all_videos.append(file.get("link"))
+                                break
+                    break
+                elif response.status_code == 429:
+                    print(f"Rate limit hit (attempt {attempt+1}/{max_retries}). Retrying in {retry_delay} seconds...")
+                    time.sleep(retry_delay)
+                    retry_delay *= 2
+                else:
+                    print(f"Error fetching videos: {response.status_code} {response.text}")
+                    if attempt < max_retries - 1:
+                        print(f"Retrying in {retry_delay} seconds...")
+                        time.sleep(retry_delay)
+                        retry_delay *= 2
+                    else:
+                        break
+            except requests.exceptions.RequestException as e:
+                print(f"Request exception: {e}")
+                if attempt < max_retries - 1:
+                    print(f"Retrying in {retry_delay} seconds...")
+                    time.sleep(retry_delay)
+                    retry_delay *= 2
+                else:
+                    break
+    if all_videos:
+        random_video = random.choice(all_videos)
+        print(f"Selected random video from {len(all_videos)} HD videos")
+        return random_video
+    else:
+        print("No suitable videos found after searching all pages.")
         return None
+def search_pexels_images(query, pexels_api_key):
+    """Search for an image on Pexels by query."""
+    headers = {'Authorization': pexels_api_key}
+    url = "https://api.pexels.com/v1/search"
+    params = {"query": query, "per_page": 5, "orientation": "landscape"}
+    max_retries = 3
+    retry_delay = 1
+    for attempt in range(max_retries):
         try:
+            response = requests.get(url, headers=headers, params=params, timeout=10)
+            if response.status_code == 200:
+                data = response.json()
+                photos = data.get("photos", [])
+                if photos:
+                    photo = random.choice(photos[:min(5, len(photos))])
+                    img_url = photo.get("src", {}).get("original")
+                    return img_url
+                else:
+                    print(f"No images found for query: {query}")
+                    return None
+            elif response.status_code == 429:
+                print(f"Rate limit hit (attempt {attempt+1}/{max_retries}). Retrying in {retry_delay} seconds...")
+                time.sleep(retry_delay)
+                retry_delay *= 2
+            else:
+                print(f"Error fetching images: {response.status_code} {response.text}")
+                if attempt < max_retries - 1:
+                    print(f"Retrying in {retry_delay} seconds...")
+                    time.sleep(retry_delay)
+                    retry_delay *= 2
         except requests.exceptions.RequestException as e:
+            print(f"Request exception: {e}")
+            if attempt < max_retries - 1:
+                print(f"Retrying in {retry_delay} seconds...")
+                time.sleep(retry_delay)
+                retry_delay *= 2
+    print(f"No Pexels images found for query: {query} after all attempts")
+    return None
 def search_google_images(query):
+    """Search for images on Google Images (for news-related queries)"""
     try:
+        search_url = f"https://www.google.com/search?q={quote(query)}&tbm=isch"
         headers = {"User-Agent": USER_AGENT}
+        response = requests.get(search_url, headers=headers, timeout=10)
         soup = BeautifulSoup(response.text, "html.parser")
         img_tags = soup.find_all("img")
+        image_urls = []
         for img in img_tags:
+            src = img.get("src", "")
+            if src.startswith("http") and "gstatic" not in src:
+                image_urls.append(src)
         if image_urls:
+            return random.choice(image_urls[:5]) if len(image_urls) >= 5 else image_urls[0]
         else:
+            print(f"No Google Images found for query: {query}")
             return None
     except Exception as e:
+        print(f"Error in Google Images search: {e}")
         return None
+def download_image(image_url, filename):
+    """Download an image from a URL to a local file with enhanced error handling."""
     try:
+        headers = {"User-Agent": USER_AGENT}
+        print(f"Downloading image from: {image_url} to {filename}")
+        response = requests.get(image_url, headers=headers, stream=True, timeout=15)
         response.raise_for_status()
         with open(filename, 'wb') as f:
             for chunk in response.iter_content(chunk_size=8192):
                 f.write(chunk)
+        print(f"Image downloaded successfully to: {filename}")
+        try:
+            img = Image.open(filename)
+            img.verify()
+            img = Image.open(filename)
+            if img.mode != 'RGB':
+                img = img.convert('RGB')
+                img.save(filename)
+            print(f"Image validated and processed: {filename}")
+            return filename
+        except Exception as e_validate:
+            print(f"Downloaded file is not a valid image: {e_validate}")
+            if os.path.exists(filename):
                 os.remove(filename)
+            return None
+    except requests.exceptions.RequestException as e_download:
+        print(f"Image download error: {e_download}")
+        if os.path.exists(filename):
+            os.remove(filename)
+        return None
+    except Exception as e_general:
+        print(f"General error during image processing: {e_general}")
         if os.path.exists(filename):
             os.remove(filename)
         return None
+def download_video(video_url, filename):
+    """Download a video from a URL to a local file."""
+    try:
+        response = requests.get(video_url, stream=True, timeout=30)
+        response.raise_for_status()
+        with open(filename, 'wb') as f:
+            for chunk in response.iter_content(chunk_size=8192):
+                f.write(chunk)
+        print(f"Video downloaded successfully to: {filename}")
+        return filename
     except Exception as e:
+        print(f"Video download error: {e}")
         if os.path.exists(filename):
             os.remove(filename)
         return None
+def generate_media(prompt, user_image=None, current_index=0, total_segments=1):
+    """
+    Generate a visual asset by first searching for a video or using a specific search strategy.
+    For news-related queries, use Google Images.
+    Returns a dict: {'path': <file_path>, 'asset_type': 'video' or 'image'}.
+    """
     safe_prompt = re.sub(r'[^\w\s-]', '', prompt).strip().replace(' ', '_')
+    if "news" in prompt.lower():
+        print(f"News-related query detected: {prompt}. Using Google Images...")
+        image_file = os.path.join(TEMP_FOLDER, f"{safe_prompt}_news.jpg")
+        image_url = search_google_images(prompt)
+        if image_url:
+            downloaded_image = download_image(image_url, image_file)
+            if downloaded_image:
+                print(f"News image saved to {downloaded_image}")
+                return {"path": downloaded_image, "asset_type": "image"}
+        else:
+            print(f"Google Images search failed for prompt: {prompt}")
+    if random.random() < 0.25:
         video_file = os.path.join(TEMP_FOLDER, f"{safe_prompt}_video.mp4")
+        video_url = search_pexels_videos(prompt, PEXELS_API_KEY)
+        if video_url:
+            downloaded_video = download_video(video_url, video_file)
+            if downloaded_video:
+                print(f"Video asset saved to {downloaded_video}")
+                return {"path": downloaded_video, "asset_type": "video"}
         else:
+            print(f"Pexels video search failed for prompt: {prompt}")
+    image_file = os.path.join(TEMP_FOLDER, f"{safe_prompt}.jpg")
+    image_url = search_pexels_images(prompt, PEXELS_API_KEY)
     if image_url:
+        downloaded_image = download_image(image_url, image_file)
+        if downloaded_image:
+            print(f"Image asset saved to {downloaded_image}")
+            return {"path": downloaded_image, "asset_type": "image"}
         else:
+            print(f"Pexels image download failed for prompt: {prompt}")
+    fallback_terms = ["nature", "people", "landscape", "technology", "business"]
     for term in fallback_terms:
+        print(f"Trying fallback image search with term: {term}")
+        fallback_file = os.path.join(TEMP_FOLDER, f"fallback_{term}.jpg")
+        fallback_url = search_pexels_images(term, PEXELS_API_KEY)
         if fallback_url:
+            downloaded_fallback = download_image(fallback_url, fallback_file)
+            if downloaded_fallback:
+                print(f"Fallback image saved to {downloaded_fallback}")
+                return {"path": downloaded_fallback, "asset_type": "image"}
             else:
+                print(f"Fallback image download failed for term: {term}")
+        else:
+            print(f"Fallback image search failed for term: {term}")
+    print(f"Failed to generate visual asset for prompt: {prompt}")
+    return None
+def generate_silent_audio(duration, sample_rate=24000):
+    """Generate a silent WAV audio file lasting 'duration' seconds."""
+    num_samples = int(duration * sample_rate)
+    silence = np.zeros(num_samples, dtype=np.float32)
+    silent_path = os.path.join(TEMP_FOLDER, f"silent_{int(time.time())}.wav")
+    sf.write(silent_path, silence, sample_rate)
+    print(f"Silent audio generated: {silent_path}")
+    return silent_path
+def generate_tts(text, voice):
+    """
+    Generate TTS audio using Kokoro, falling back to gTTS or silent audio if needed.
+    """
+    safe_text = re.sub(r'[^\w\s-]', '', text[:10]).strip().replace(' ', '_')
+    file_path = os.path.join(TEMP_FOLDER, f"tts_{safe_text}.wav")
+    if os.path.exists(file_path):
+        print(f"Using cached TTS for text '{text[:10]}...'")
+        return file_path
     try:
+        kokoro_voice = 'af_heart' if voice == 'en' else voice
+        generator = pipeline(text, voice=kokoro_voice, speed=0.9, split_pattern=r'\n+')
+        audio_segments = []
+        for i, (gs, ps, audio) in enumerate(generator):
+            audio_segments.append(audio)
+        full_audio = np.concatenate(audio_segments) if len(audio_segments) > 1 else audio_segments[0]
+        sf.write(file_path, full_audio, 24000)
+        print(f"TTS audio saved to {file_path} (Kokoro)")
         return file_path
     except Exception as e:
+        print(f"Error with Kokoro TTS: {e}")
         try:
+            print("Falling back to gTTS...")
+            tts = gTTS(text=text, lang='en')
+            mp3_path = os.path.join(TEMP_FOLDER, f"tts_{safe_text}.mp3")
+            tts.save(mp3_path)
+            audio = AudioSegment.from_mp3(mp3_path)
+            audio.export(file_path, format="wav")
+            os.remove(mp3_path)
+            print(f"Fallback TTS saved to {file_path} (gTTS)")
             return file_path
+        except Exception as fallback_error:
+            print(f"Both TTS methods failed: {fallback_error}")
+            return generate_silent_audio(duration=max(3, len(text.split()) * 0.5))
+def apply_kenburns_effect(clip, target_resolution, effect_type=None):
+    """Apply a smooth Ken Burns effect with a single movement pattern."""
     target_w, target_h = target_resolution
     clip_aspect = clip.w / clip.h
     target_aspect = target_w / target_h
+    if clip_aspect > target_aspect:
         new_height = target_h
         new_width = int(new_height * clip_aspect)
+    else:
         new_width = target_w
         new_height = int(new_width / clip_aspect)
+    clip = clip.resize(newsize=(new_width, new_height))
+    base_scale = 1.15
+    new_width = int(new_width * base_scale)
+    new_height = int(new_height * base_scale)
+    clip = clip.resize(newsize=(new_width, new_height))
+    max_offset_x = new_width - target_w
+    max_offset_y = new_height - target_h
+    available_effects = ["zoom-in", "zoom-out", "pan-left", "pan-right", "up-left"]
+    if effect_type is None or effect_type == "random":
+        effect_type = random.choice(available_effects)
     if effect_type == "zoom-in":
+        start_zoom = 0.9
+        end_zoom = 1.1
+        start_center = (new_width / 2, new_height / 2)
+        end_center = start_center
     elif effect_type == "zoom-out":
+        start_zoom = 1.1
+        end_zoom = 0.9
+        start_center = (new_width / 2, new_height / 2)
+        end_center = start_center
     elif effect_type == "pan-left":
+        start_zoom = 1.0
+        end_zoom = 1.0
+        start_center = (max_offset_x + target_w / 2, (max_offset_y // 2) + target_h / 2)
+        end_center = (target_w / 2, (max_offset_y // 2) + target_h / 2)
     elif effect_type == "pan-right":
+        start_zoom = 1.0
+        end_zoom = 1.0
+        start_center = (target_w / 2, (max_offset_y // 2) + target_h / 2)
+        end_center = (max_offset_x + target_w / 2, (max_offset_y // 2) + target_h / 2)
+    elif effect_type == "up-left":
+        start_zoom = 1.0
+        end_zoom = 1.0
+        start_center = (max_offset_x + target_w / 2, max_offset_y + target_h / 2)
+        end_center = (target_w / 2, target_h / 2)
+    else:
+        raise ValueError(f"Unsupported effect_type: {effect_type}")
     def transform_frame(get_frame, t):
+        frame = get_frame(t)
+        ratio = t / clip.duration if clip.duration > 0 else 0
+        ratio = 0.5 - 0.5 * math.cos(math.pi * ratio)
         current_zoom = start_zoom + (end_zoom - start_zoom) * ratio
         crop_w = int(target_w / current_zoom)
         crop_h = int(target_h / current_zoom)
+        current_center_x = start_center[0] + (end_center[0] - start_center[0]) * ratio
+        current_center_y = start_center[1] + (end_center[1] - start_center[1]) * ratio
         min_center_x = crop_w / 2
+        max_center_x = new_width - crop_w / 2
         min_center_y = crop_h / 2
+        max_center_y = new_height - crop_h / 2
         current_center_x = max(min_center_x, min(current_center_x, max_center_x))
         current_center_y = max(min_center_y, min(current_center_y, max_center_y))
+        cropped_frame = cv2.getRectSubPix(frame, (crop_w, crop_h), (current_center_x, current_center_y))
+        resized_frame = cv2.resize(cropped_frame, (target_w, target_h), interpolation=cv2.INTER_LANCZOS4)
+        return resized_frame
+    return clip.fl(transform_frame)
 def resize_to_fill(clip, target_resolution):
+    """Resize and crop a clip to fill the target resolution while maintaining aspect ratio."""
     target_w, target_h = target_resolution
+    clip_aspect = clip.w / clip.h
     target_aspect = target_w / target_h
+    if clip_aspect > target_aspect:
         clip = clip.resize(height=target_h)
         crop_amount = (clip.w - target_w) / 2
+        clip = clip.crop(x1=crop_amount, x2=clip.w - crop_amount, y1=0, y2=clip.h)
     else:
         clip = clip.resize(width=target_w)
         crop_amount = (clip.h - target_h) / 2
+        clip = clip.crop(x1=0, x2=clip.w, y1=crop_amount, y2=clip.h - crop_amount)
+    return clip
+def find_mp3_files():
+    """Search for any MP3 files in the current directory and subdirectories."""
+    mp3_files = []
+    for root, dirs, files in os.walk('.'):
+        for file in files:
+            if file.endswith('.mp3'):
+                mp3_path = os.path.join(root, file)
+                mp3_files.append(mp3_path)
+                print(f"Found MP3 file: {mp3_path}")
+    return mp3_files[0] if mp3_files else None
+def add_background_music(final_video, bg_music_volume=0.08):
+    """Add background music to the final video using any MP3 file found."""
     try:
+        bg_music_path = find_mp3_files()
+        if bg_music_path and os.path.exists(bg_music_path):
+            print(f"Adding background music from: {bg_music_path}")
+            bg_music = AudioFileClip(bg_music_path)
+            if bg_music.duration < final_video.duration:
+                loops_needed = math.ceil(final_video.duration / bg_music.duration)
+                bg_segments = [bg_music] * loops_needed
+                bg_music = concatenate_audioclips(bg_segments)
+            bg_music = bg_music.subclip(0, final_video.duration)
+            bg_music = bg_music.volumex(bg_music_volume)
+            video_audio = final_video.audio
             mixed_audio = CompositeAudioClip([video_audio, bg_music])
+            final_video = final_video.set_audio(mixed_audio)
+            print("Background music added successfully")
         else:
+            print("No MP3 files found, skipping background music")
         return final_video
     except Exception as e:
         print(f"Error adding background music: {e}")
+        print("Continuing without background music")
         return final_video
 def create_clip(media_path, asset_type, tts_path, duration=None, effects=None, narration_text=None, segment_index=0):
+    """Create a video clip with synchronized subtitles and narration."""
     try:
+        print(f"Creating clip #{segment_index} with asset_type: {asset_type}, media_path: {media_path}")
+        if not os.path.exists(media_path) or not os.path.exists(tts_path):
+            print("Missing media or TTS file")
             return None
+        audio_clip = AudioFileClip(tts_path).audio_fadeout(0.2)
+        audio_duration = audio_clip.duration
+        target_duration = audio_duration + 0.2
         if asset_type == "video":
+            clip = VideoFileClip(media_path)
+            clip = resize_to_fill(clip, TARGET_RESOLUTION)
+            if clip.duration < target_duration:
+                clip = clip.loop(duration=target_duration)
+            else:
+                clip = clip.subclip(0, target_duration)
         elif asset_type == "image":
+            img = Image.open(media_path)
+            if img.mode != 'RGB':
+                with tempfile.NamedTemporaryFile(suffix='.jpg', delete=False) as temp:
+                    img.convert('RGB').save(temp.name)
+                    media_path = temp.name
+                img.close()
+            clip = ImageClip(media_path).set_duration(target_duration)
+            clip = apply_kenburns_effect(clip, TARGET_RESOLUTION)
+            clip = clip.fadein(0.3).fadeout(0.3)
         else:
+            return None
         if narration_text and CAPTION_COLOR != "transparent":
             try:
                 words = narration_text.split()
+                chunks = []
+                current_chunk = []
+                for word in words:
+                    current_chunk.append(word)
+                    if len(current_chunk) >= 5:
+                        chunks.append(' '.join(current_chunk))
+                        current_chunk = []
+                if current_chunk:
+                    chunks.append(' '.join(current_chunk))
+                chunk_duration = audio_duration / len(chunks)
+                subtitle_clips = []
+                subtitle_y_position = int(TARGET_RESOLUTION[1] * 0.70)
                 for i, chunk_text in enumerate(chunks):
                     start_time = i * chunk_duration
+                    end_time = (i + 1) * chunk_duration
                     txt_clip = TextClip(
                         chunk_text,
+                        fontsize=45,
+                        font='Arial-Bold',
                         color=CAPTION_COLOR,
+                        bg_color='rgba(0, 0, 0, 0.25)',
+                        method='caption',
                         align='center',
+                        stroke_width=2,
+                        stroke_color=CAPTION_COLOR,
+                        size=(TARGET_RESOLUTION[0] * 0.8, None)
+                    ).set_start(start_time).set_end(end_time)
+                    txt_clip = txt_clip.set_position(('center', subtitle_y_position))
                     subtitle_clips.append(txt_clip)
+                clip = CompositeVideoClip([clip] + subtitle_clips)
+            except Exception as sub_error:
+                print(f"Subtitle error: {sub_error}")
+                txt_clip = TextClip(
+                    narration_text,
+                    fontsize=28,
+                    color=CAPTION_COLOR,
+                    align='center',
+                    size=(TARGET_RESOLUTION[0] * 0.7, None)
+                ).set_position(('center', int(TARGET_RESOLUTION[1] / 3))).set_duration(clip.duration)
+                clip = CompositeVideoClip([clip, txt_clip])
         clip = clip.set_audio(audio_clip)
+        print(f"Clip created: {clip.duration:.1f}s")
         return clip
+    except Exception as e:
+        print(f"Error in create_clip: {str(e)}")
+        return None
+def fix_imagemagick_policy():
+    """Fix ImageMagick security policies."""
+    try:
+        print("Attempting to fix ImageMagick security policies...")
+        policy_paths = [
+            "/etc/ImageMagick-6/policy.xml",
+            "/etc/ImageMagick-7/policy.xml",
+            "/etc/ImageMagick/policy.xml",
+            "/usr/local/etc/ImageMagick-7/policy.xml"
+        ]
+        found_policy = next((path for path in policy_paths if os.path.exists(path)), None)
+        if not found_policy:
+            print("No policy.xml found. Using alternative subtitle method.")
+            return False
+        print(f"Modifying policy file at {found_policy}")
+        os.system(f"sudo cp {found_policy} {found_policy}.bak")
+        os.system(f"sudo sed -i 's/rights=\"none\"/rights=\"read|write\"/g' {found_policy}")
+        os.system(f"sudo sed -i 's/<policy domain=\"path\" pattern=\"@\*\"[^>]*>/<policy domain=\"path\" pattern=\"@*\" rights=\"read|write\"/g' {found_policy}")
+        os.system(f"sudo sed -i 's/<policy domain=\"coder\" rights=\"none\" pattern=\"PDF\"[^>]*>/<!-- <policy domain=\"coder\" rights=\"none\" pattern=\"PDF\"> -->/g' {found_policy}")
+        print("ImageMagick policies updated successfully.")
+        return True
     except Exception as e:
+        print(f"Error fixing policies: {e}")
+        return False
+# ---------------- Main Function with Gradio Integration ---------------- #
+def generate_video(user_input, resolution, caption_option):
+    """Generate a video based on user input via Gradio."""
+    global TARGET_RESOLUTION, CAPTION_COLOR, TEMP_FOLDER
+    import shutil
+    # Set resolution
+    if resolution == "Full":
         TARGET_RESOLUTION = (1920, 1080)
+    elif resolution == "Short":
+        TARGET_RESOLUTION = (1080, 1920)
+    else:
+        TARGET_RESOLUTION = (1920, 1080)  # Default
+    # Set caption color
+    CAPTION_COLOR = "white" if caption_option == "Yes" else "transparent"
+    # Create a unique temporary folder
+    TEMP_FOLDER = tempfile.mkdtemp()
+    # Fix ImageMagick policy
+    fix_success = fix_imagemagick_policy()
+    if not fix_success:
+        print("Will use alternative methods if needed")
+    print("Generating script from API...")
+    script = generate_script(user_input)
+    if not script:
+        print("Failed to generate script.")
+        shutil.rmtree(TEMP_FOLDER)
+        return None
+    print("Generated Script:\n", script)
     elements = parse_script(script)
     if not elements:
+        print("Failed to parse script into elements.")
+        shutil.rmtree(TEMP_FOLDER)
+        return None
+    print(f"Parsed {len(elements)//2} script segments.")
     paired_elements = []
+    for i in range(0, len(elements), 2):
+        if i + 1 < len(elements):
+            paired_elements.append((elements[i], elements[i + 1]))
     if not paired_elements:
+        print("No valid script segments found.")
+        shutil.rmtree(TEMP_FOLDER)
+        return None
     clips = []
     for idx, (media_elem, tts_elem) in enumerate(paired_elements):
+        print(f"\nProcessing segment {idx+1}/{len(paired_elements)} with prompt: '{media_elem['prompt']}'")
+        media_asset = generate_media(media_elem['prompt'], current_index=idx, total_segments=len(paired_elements))
+        if not media_asset:
+            print(f"Skipping segment {idx+1} due to missing media asset.")
+            continue
         tts_path = generate_tts(tts_elem['text'], tts_elem['voice'])
         if not tts_path:
+            print(f"Skipping segment {idx+1} due to TTS generation failure.")
+            continue
         clip = create_clip(
             media_path=media_asset['path'],
             asset_type=media_asset['asset_type'],
             tts_path=tts_path,
+            duration=tts_elem['duration'],
+            effects=media_elem.get('effects', 'fade-in'),
             narration_text=tts_elem['text'],
             segment_index=idx
         )
         if clip:
             clips.append(clip)
         else:
+            print(f"Clip creation failed for segment {idx+1}.")
     if not clips:
+        print("No clips were successfully created.")
         shutil.rmtree(TEMP_FOLDER)
+        return None
+    print("\nConcatenating clips...")
+    final_video = concatenate_videoclips(clips, method="compose")
+    final_video = add_background_music(final_video, bg_music_volume=0.08)
+    print(f"Exporting final video to {OUTPUT_VIDEO_FILENAME}...")
+    final_video.write_videofile(OUTPUT_VIDEO_FILENAME, codec='libx264', fps=24, preset='veryfast')
+    print(f"Final video saved as {OUTPUT_VIDEO_FILENAME}")
+    # Clean up
+    print("Cleaning up temporary files...")
+    shutil.rmtree(TEMP_FOLDER)
+    print("Temporary files removed.")
     return OUTPUT_VIDEO_FILENAME
+# ---------------- Gradio Interface ---------------- #
+iface = gr.Interface(
+    fn=generate_video,
+    inputs=[
+        gr.Textbox(label="Video Concept", placeholder="Enter your video concept here..."),
+        gr.Radio(["Full", "Short"], label="Resolution", value="Full"),
+        gr.Radio(["Yes", "No"], label="Captions", value="Yes")
+    ],
+    outputs=gr.Video(label="Generated Video"),
+    title="AI Documentary Video Generator",
+    description="Create a funny documentary-style video based on your concept. Note: Generation may take several minutes on CPU."
+)
+# Launch the interface
+iface.launch(share=True)