# Source: Hugging Face Space "mgbam/ChronoWeave" (file size: 45,286 bytes).
# The web viewer's page chrome and per-line blame hashes (62f88b4, 3c37f6f,
# 09b00d7) that preceded the code were extraction residue, not part of the
# program, and are omitted here.

# Copyright 2025 Google LLC. Based on work by Yousif Ahmed.
# Concept: ChronoWeave - Branching Narrative Generation
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0

import streamlit as st
import google.generativeai as genai
import os
import json
import numpy as np
from io import BytesIO
import time
import wave
import contextlib
import asyncio
import uuid # For unique identifiers
import shutil # For directory operations
import logging # For better logging

# Image handling
from PIL import Image
# Pydantic for data validation
from pydantic import BaseModel, Field, ValidationError, validator
from typing import List, Optional, Literal

# Video and audio processing
from moviepy.editor import ImageClip, AudioFileClip, concatenate_videoclips
# from moviepy.config import change_settings # Potential for setting imagemagick path if needed

# Type hints
import typing_extensions as typing

# Async support for Streamlit/Google API
import nest_asyncio
nest_asyncio.apply() # Apply patch for asyncio in environments like Streamlit/Jupyter

# --- Logging Setup ---
# Configure root logging at INFO with a "timestamp - level - message" format.
# `logger` is the module-level logger used by the rest of this file.
logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
logger = logging.getLogger(__name__)

# --- Configuration ---
# Page-level Streamlit setup: wide layout with the sidebar expanded on load.
# NOTE(review): Streamlit expects set_page_config to run before other st.* calls;
# keep it ahead of the title/markdown below — confirm against the Streamlit docs.
st.set_page_config(page_title="ChronoWeave", layout="wide", initial_sidebar_state="expanded")
# Page heading followed by a short introductory blurb (rendered as Markdown).
st.title("🌀 ChronoWeave: Advanced Branching Narrative Generator")
st.markdown("""
Generate multiple, branching story timelines from a single theme using AI, complete with images and narration.
*Based on the work of Yousif Ahmed. Copyright 2025 Google LLC.*
""")

# --- Constants ---

# Text / structured-JSON generation.
# "gemini-1.5-pro" is an alternative for potentially higher quality (and cost).
TEXT_MODEL_ID = "models/gemini-1.5-flash"

# Audio generation.
# AUDIO_API_VERSION: API version associated with the audio modality.
# AUDIO_MODEL_ID: model handle used for narration requests.
# AUDIO_SAMPLING_RATE: sample rate (Hz) used both in the audio request config
# and when writing WAV files.
AUDIO_API_VERSION = 'v1alpha'
AUDIO_MODEL_ID = "models/gemini-1.5-flash"
AUDIO_SAMPLING_RATE = 24000

# Image generation.
# A pinned version such as "imagen-3.0-generate-002" may be used instead.
IMAGE_MODEL_ID = "imagen-3"
DEFAULT_ASPECT_RATIO = "1:1"

# Video assembly: frame rate plus the H.264 / AAC codecs commonly used for MP4.
VIDEO_FPS = 24
VIDEO_CODEC = "libx264"
AUDIO_CODEC = "aac"

# File management: base name for temporary working directories.
TEMP_DIR_BASE = ".chrono_temp"

# --- API Key Handling ---
# Resolution order:
#   1. Streamlit secrets (preferred when deployed).
#   2. The GOOGLE_API_KEY environment variable (local development).
# If neither yields a non-empty key, an error is shown and the script halts.
GOOGLE_API_KEY = None
try:
    GOOGLE_API_KEY = st.secrets["GOOGLE_API_KEY"]
except (KeyError, FileNotFoundError):
    # KeyError: a secrets file exists but has no GOOGLE_API_KEY entry.
    # FileNotFoundError: there is no secrets.toml at all, which is the normal
    # situation for local development. Catching only KeyError made the
    # environment-variable fallback below unreachable in that case.
    # NOTE(review): newer Streamlit releases raise StreamlitSecretNotFoundError,
    # which is understood to subclass FileNotFoundError — confirm for the
    # pinned Streamlit version.
    GOOGLE_API_KEY = None

if GOOGLE_API_KEY:
    logger.info("Google API Key loaded from Streamlit secrets.")
else:
    # Fallback (also used when the secret is present but empty).
    GOOGLE_API_KEY = os.environ.get('GOOGLE_API_KEY')
    if GOOGLE_API_KEY:
        logger.info("Google API Key loaded from environment variable.")
    else:
        # Neither source provided a key: tell the user how to fix it and stop.
        st.error(
            "🚨 **Google API Key Not Found!**\n"
            "Please configure your Google API Key:\n"
            "1.  **Streamlit Cloud/Hugging Face Spaces:** Add it as a Secret named `GOOGLE_API_KEY` in your app's settings.\n"
            "2.  **Local Development:** Set the `GOOGLE_API_KEY` environment variable or create a `.streamlit/secrets.toml` file.",
            icon="🚨"
        )
        st.stop()  # Halt execution

# --- Initialize Google Clients ---
# Configures the google-generativeai library once and creates two module-level
# GenerativeModel handles: `client_standard` (text/JSON and image requests) and
# `live_model` (narration audio). Any failure is reported in the UI and halts the script.
try:
    # Configure the library globally with the resolved API key.
    genai.configure(api_key=GOOGLE_API_KEY)
    logger.info("Configured google-generativeai with API key.")

    # Handle used for story-structure (text/JSON) generation and image requests.
    client_standard = genai.GenerativeModel(TEXT_MODEL_ID)
    logger.info(f"Initialized standard GenerativeModel for {TEXT_MODEL_ID}.")

    # Handle used by generate_audio_live_async, which calls `.connect(...)` on it.
    # NOTE(review): it is not evident from this file that GenerativeModel exposes
    # a `.connect` method; verify against the installed google-generativeai version,
    # otherwise audio generation will fail at call time rather than here.
    live_model = genai.GenerativeModel(AUDIO_MODEL_ID) # Same class as client_standard, different model id constant
    logger.info(f"Initialized GenerativeModel handle for audio ({AUDIO_MODEL_ID}).")
    # No separate live client or explicit endpoint is set up here; the audio
    # request config is built inside generate_audio_live_async.

except AttributeError as ae:
     # Reported separately so the user is pointed at a library-version problem
     # (e.g. an unexpected or very old google-generativeai package layout).
     logger.exception("AttributeError during Google AI Client Initialization.")
     st.error(f"🚨 Failed to initialize Google AI Clients due to an unexpected library structure error: {ae}. Please ensure 'google-generativeai' is up-to-date.", icon="🚨")
     st.stop()
except Exception as e:
    # Any other initialization failure: log with traceback, show it, and halt.
    logger.exception("Failed to initialize Google AI Clients.")
    st.error(f"🚨 Failed to initialize Google AI Clients: {e}", icon="🚨")
    st.stop()


# --- Define Pydantic Schemas for Robust Validation ---
class StorySegment(BaseModel):
    # One scene of a timeline: the image prompt, the narration sentence, and
    # the descriptive hints used to keep visuals consistent.
    # Documented with comments rather than a class docstring because this
    # model's JSON schema is embedded in the LLM prompt, and a docstring would
    # be emitted there as an extra `description`.
    scene_id: int = Field(..., ge=0, description="Scene number within the timeline, starting from 0.")
    image_prompt: str = Field(..., min_length=10, max_length=150, description="Concise visual description for image generation (15-35 words). Focus on non-human characters, setting, action, style.")
    audio_text: str = Field(..., min_length=5, max_length=150, description="Single sentence of narration/dialogue for the scene (max 30 words).")
    character_description: str = Field(..., max_length=100, description="Brief description of key non-human characters/objects in *this* scene's prompt for consistency.")
    timeline_visual_modifier: Optional[str] = Field(None, max_length=50, description="Optional subtle visual style hint (e.g., 'slightly darker', 'more vibrant colors').")

    @validator('image_prompt')
    def image_prompt_no_humans(cls, v):
        # Advisory check only: logs a warning when the prompt appears to mention
        # humans, but never rejects or alters the value.
        #
        # Whole-word matching is used so that ordinary words which merely
        # contain a term ("many", "salamander", "personality", "command")
        # no longer trigger false warnings, as plain substring tests did.
        import re  # Local import: `re` is not in the file's visible import block.

        human_terms = (
            r"\b(?:persons?|people|humans?|humanoids?|man|men|woman|women|"
            r"boys?|girls?|child|children)\b"
        )
        if re.search(human_terms, v, flags=re.IGNORECASE):
            logger.warning(f"Image prompt '{v[:50]}...' may contain human descriptions. Relying on API-level controls & prompt instructions.")
        return v

# One branch of the generated story: an identifier, the reason it diverged,
# and its ordered scenes.
# Kept as `#` comments rather than a class docstring: this model's JSON schema
# is embedded in the LLM prompt, and a docstring would be emitted there as an
# extra `description`.
class Timeline(BaseModel):
    # Non-negative identifier for the timeline (ge=0).
    timeline_id: int = Field(..., ge=0, description="Unique identifier for this timeline.")
    # Free-text explanation of the branch point; at least 5 characters.
    divergence_reason: str = Field(..., min_length=5, description="Clear reason why this timeline branched off.")
    # Scenes in order; at least one is required (min_items=1).
    segments: List[StorySegment] = Field(..., min_items=1, description="List of scenes composing this timeline.")

class ChronoWeaveResponse(BaseModel):
    # Top-level structure expected back from the story-generation request:
    # the theme, every timeline, and the scene count each timeline must have.
    # Documented with comments rather than a class docstring because this
    # model's JSON schema is embedded in the LLM prompt, and a docstring would
    # be emitted there as an extra `description`.
    core_theme: str = Field(..., min_length=5, description="The central theme provided by the user.")
    timelines: List[Timeline] = Field(..., min_items=1, description="List of generated timelines.")
    total_scenes_per_timeline: int = Field(..., gt=0, description="The requested number of scenes per timeline.")

    # The cross-field check hangs off `total_scenes_per_timeline`, the LAST of
    # the two fields involved. Pydantic validates fields in declaration order
    # and `values` only holds fields validated so far; attached to `timelines`
    # (declared earlier), the scene count was never available and the check
    # silently never ran.
    @validator('total_scenes_per_timeline')
    def check_timeline_segment_count(cls, total_scenes_per_timeline, values):
        # `timelines` is absent from `values` when its own validation failed;
        # in that case there is nothing to compare and its error is reported
        # on its own.
        for i, timeline in enumerate(values.get('timelines') or []):
            if len(timeline.segments) != total_scenes_per_timeline:
                raise ValueError(f"Timeline {i} (ID: {timeline.timeline_id}) has {len(timeline.segments)} segments, but expected {total_scenes_per_timeline}.")
        return total_scenes_per_timeline

# --- Helper Functions ---

@contextlib.contextmanager
def wave_file_writer(filename: str, channels: int = 1, rate: int = AUDIO_SAMPLING_RATE, sample_width: int = 2):
    """
    Open `filename` as a WAV file for writing and yield the configured writer.

    The writer is set up with the given channel count, sample width (bytes per
    sample; 2 means 16-bit audio) and frame rate before being handed to the
    caller. Any exception raised while opening, configuring, or inside the
    caller's `with` body is logged and re-raised. The file is always closed on
    exit; a failure while closing is logged but not propagated.
    """
    wav_out = None
    try:
        wav_out = wave.open(filename, "wb")
        wav_out.setnchannels(channels)
        wav_out.setsampwidth(sample_width)
        wav_out.setframerate(rate)
        yield wav_out
    except Exception as err:
        # Exceptions from the caller's `with` block surface here as well,
        # because they are re-raised at the `yield` above.
        logger.error(f"Error opening/configuring wave file {filename}: {err}")
        raise
    finally:
        # `wav_out` stays None when wave.open itself failed.
        if wav_out is not None:
            try:
                wav_out.close()
            except Exception as close_err:
                logger.error(f"Error closing wave file {filename}: {close_err}")


async def generate_audio_live_async(api_text: str, output_filename: str, voice: Optional[str] = None) -> Optional[str]:
    """
    Request narration audio for one sentence and save it as a WAV file.

    The text is wrapped in a directive asking the model to speak only the
    sentence itself, streamed through a session opened on the module-level
    `live_model`, and the received audio bytes are written to
    `output_filename` via `wave_file_writer`.

    Args:
        api_text: Sentence to narrate.
        output_filename: Destination WAV path; its base name up to the first
            '.' is used as the task tag in log and UI messages.
        voice: Currently unused (the only reference to it is commented out).

    Returns:
        `output_filename` on success; None when the stream reports an error,
        no audio is received, the prompt is blocked, or any other exception
        occurs. Failures are logged and shown in the Streamlit UI.

    NOTE(review): this relies on `live_model.connect(...)`, `send_request`,
    `stream_content` and `response.audio_chunk`; confirm that the installed
    google-generativeai `GenerativeModel` actually provides this interface.
    """
    # File stem (e.g. a T#_S# scene tag) doubles as the identifier in messages.
    task_id = os.path.basename(output_filename).split('.')[0]
    pcm_buffer = bytearray()
    logger.info(f"🎙️ [{task_id}] Requesting audio for: '{api_text[:60]}...'")

    try:
        # LINEAR16 at the module sampling rate matches what the WAV writer expects.
        audio_settings = {
            "audio_encoding": "LINEAR16",
            "sample_rate_hertz": AUDIO_SAMPLING_RATE,
        }
        live_config = {
            "response_modalities": ["AUDIO"],
            "audio_config": audio_settings,
        }

        # Directive prefix discourages conversational filler around the sentence.
        narration_request = (
            "Narrate the following sentence directly and engagingly. "
            "Do not add any introductory or concluding remarks like 'Okay', 'Sure', or 'Here is the narration'. "
            "Speak only the sentence itself:\n\n"
            f'"{api_text}"'
        )

        async with live_model.connect(config=live_config) as session:
            await session.send_request([narration_request])
            async for message in session.stream_content():
                chunk = message.audio_chunk
                if chunk and chunk.data:
                    pcm_buffer.extend(chunk.data)
                # An error reported mid-stream aborts this request entirely.
                stream_error = getattr(message, 'error', None)
                if stream_error:
                    logger.error(f"   ❌ [{task_id}] Error during audio stream: {stream_error}")
                    st.error(f"Audio stream error for scene {task_id}: {stream_error}", icon="🔊")
                    return None

        if not pcm_buffer:
            logger.warning(f"⚠️ [{task_id}] No audio data received for: '{api_text[:60]}...'")
            st.warning(f"No audio data generated for scene {task_id}.", icon="🔊")
            return None

        # Persist the raw audio bytes as a WAV file.
        with wave_file_writer(output_filename, rate=AUDIO_SAMPLING_RATE) as wav_out:
            wav_out.writeframes(bytes(pcm_buffer))
        logger.info(f"   ✅ [{task_id}] Audio saved: {os.path.basename(output_filename)} ({len(pcm_buffer)} bytes)")
        return output_filename

    except genai.types.generation_types.BlockedPromptException as blocked:
        logger.error(f"   ❌ [{task_id}] Audio generation blocked for prompt '{api_text[:60]}...': {blocked}")
        st.error(f"Audio generation blocked for scene {task_id} due to safety settings.", icon="🔇")
        return None
    except Exception as exc:
        # Anything else raised while connecting, sending, streaming or writing.
        logger.exception(f"   ❌ [{task_id}] Audio generation failed unexpectedly for '{api_text[:60]}...': {exc}")
        st.error(f"Audio generation failed for scene {task_id}: {exc}", icon="🔊")
        return None


def generate_story_sequence_chrono(
    theme: str,
    num_scenes: int,
    num_timelines: int,
    divergence_prompt: str = ""
) -> Optional[ChronoWeaveResponse]:
    """
    Ask the text model for a branching story and return it as a validated object.

    Builds a prompt embedding the theme, the requested timeline and scene
    counts, an optional divergence hint and the ChronoWeaveResponse JSON
    schema; requests a JSON response from `client_standard`; parses it; and
    validates it with Pydantic.

    Args:
        theme: Core theme of the story.
        num_scenes: Scenes requested per timeline.
        num_timelines: Number of timelines requested.
        divergence_prompt: Optional hint describing how timelines should diverge.

    Returns:
        A validated ChronoWeaveResponse, or None when the prompt is blocked,
        the response cannot be read or parsed as JSON, validation fails, or
        any other error occurs. Every failure is logged and shown in the UI.
    """
    st.info(f"📚 Generating {num_timelines} timeline(s) x {num_scenes} scenes for theme: '{theme}'...")
    logger.info(f"Requesting story structure: Theme='{theme}', Timelines={num_timelines}, Scenes={num_scenes}")

    divergence_instruction = (
        "Introduce clear points of divergence between timelines, starting potentially after the first scene. "
        f"If provided, use this hint for divergence: '{divergence_prompt}'. "
        "Clearly state the divergence reason for each timeline (except potentially the first)."
    )

    # .schema() is the Pydantic v1 spelling; v2 would use .model_json_schema().
    schema_json = json.dumps(ChronoWeaveResponse.schema(), indent=2)

    prompt = f"""
    Act as an expert narrative designer specializing in short, visual, branching stories for children.
    Create a story based on the core theme: "{theme}".

    **Instructions:**
    1.  Generate exactly **{num_timelines}** distinct timelines.
    2.  Each timeline must contain exactly **{num_scenes}** sequential scenes.
    3.  **Crucially, DO NOT include any humans, people, or humanoid figures** in the descriptions or actions. Focus strictly on animals, fantasy creatures, animated objects, or natural elements.
    4.  {divergence_instruction}
    5.  Maintain a consistent visual style across all scenes and timelines: **'Simple, friendly kids animation style with bright colors and rounded shapes'**, unless a `timeline_visual_modifier` subtly alters it.
    6.  Each scene's narration (`audio_text`) should be a single, concise sentence (approx. 5-10 seconds spoken length, max 30 words).
    7.  Image prompts (`image_prompt`) should be descriptive (15-35 words), focusing on the non-human character(s), setting, action, and visual style. Explicitly mention the main character(s) for consistency.
    8.  `character_description` should briefly describe recurring non-human characters mentioned *in the specific scene's image prompt* (name, key visual features). Keep consistent within a timeline.

    **Output Format:**
    Respond ONLY with a valid JSON object adhering strictly to the provided schema. Do not include any text before or after the JSON object.

    **JSON Schema:**
    ```json
    {schema_json}
    ```
    """

    try:
        # JSON mime type requests structured output; temperature adds some creativity.
        json_generation_config = genai.types.GenerationConfig(
            response_mime_type="application/json",
            temperature=0.7,
        )
        llm_response = client_standard.generate_content(
            contents=prompt,
            generation_config=json_generation_config,
        )

        # Step 1: read the response text and decode it as JSON.
        try:
            raw_text = llm_response.text
            payload = json.loads(raw_text)
        except json.JSONDecodeError as decode_err:
            logger.error(f"Failed to decode JSON response: {decode_err}")
            logger.error(f"Problematic Response Text:\n{raw_text}")
            st.error(f"🚨 Failed to parse the story structure from the AI. Error: {decode_err}", icon="📄")
            st.text_area("Problematic AI Response:", raw_text, height=200)
            return None
        except Exception as access_err:
            # Covers failures while reading the response text itself.
            logger.error(f"Error accessing or decoding response text: {access_err}")
            st.error(f"🚨 Error processing AI response: {access_err}", icon="📄")
            return None

        # Step 2: validate the decoded structure
        # (parse_obj is the Pydantic v1 API; v2 would use model_validate).
        try:
            story = ChronoWeaveResponse.parse_obj(payload)
        except ValidationError as schema_err:
            logger.error(f"JSON structure validation failed: {schema_err}")
            logger.error(f"Received Data:\n{json.dumps(payload, indent=2)}")
            st.error(f"🚨 The generated story structure is invalid: {schema_err}", icon="🧬")
            st.json(payload)  # Show the invalid structure
            return None
        else:
            logger.info("✅ Story structure generated and validated successfully!")
            st.success("✅ Story structure generated and validated!")
            return story

    except genai.types.generation_types.BlockedPromptException as blocked:
        logger.error(f"Story generation prompt blocked: {blocked}")
        st.error("🚨 The story generation prompt was blocked, likely due to safety filters. Try rephrasing the theme.", icon="🚫")
        return None
    except Exception as exc:
        logger.exception("Error during story sequence generation:")
        st.error(f"🚨 An unexpected error occurred during story generation: {exc}", icon="💥")
        return None


def generate_image_imagen(prompt: str, aspect_ratio: str = "1:1", task_id: str = "IMG") -> Optional[Image.Image]:
    """
    Generates an image using Imagen via the standard client with specific controls.

    The scene prompt is wrapped in fixed style guidance (child-friendly animation
    style, no human figures) and sent through ``client_standard.generate_content``.
    Every failure is logged, surfaced in the Streamlit UI and reported as ``None``;
    no exception escapes this function.

    Args:
        prompt: Scene description to illustrate.
        aspect_ratio: Desired aspect ratio. It is only stated in the prompt text,
            not passed as a generation parameter.
        task_id: Short identifier used as a prefix in log and UI messages.

    Returns:
        A fully decoded PIL Image, or None if the request failed, was blocked,
        or returned no usable inline image data.
    """
    logger.info(f"🖼️ [{task_id}] Requesting image for: '{prompt[:70]}...' (Aspect: {aspect_ratio})")

    # Refined prompt incorporating negative constraints and style guidance
    full_prompt = (
        f"Generate an image in a child-friendly, simple animation style with bright colors and rounded shapes. "
        f"Ensure absolutely NO humans or human-like figures are present. Focus on animals or objects. "
        f"Aspect ratio should be {aspect_ratio}. " # Explicitly state aspect ratio in prompt too
        f"Prompt: {prompt}"
    )

    try:
        # Use the standard client's generate_content method.
        response = client_standard.generate_content(
            full_prompt,
            generation_config=genai.types.GenerationConfig(
                candidate_count=1,
            ),
        )

        # Scan every part of the first candidate instead of assuming the image is
        # the first one; the first part carrying inline bytes wins.
        image_bytes = None
        saw_file_uri = False
        candidates = response.candidates
        if candidates and candidates[0].content and candidates[0].content.parts:
            for part in candidates[0].content.parts:
                inline_data = getattr(part, 'inline_data', None)
                if inline_data and getattr(inline_data, 'data', None):
                    image_bytes = inline_data.data
                    break
                if getattr(part, 'file_data', None):
                    saw_file_uri = True

        if image_bytes:
            try:
                image = Image.open(BytesIO(image_bytes))
                # Image.open is lazy: force decoding now so corrupt data is caught
                # by this handler rather than later when the image is saved.
                image.load()
                logger.info(f"   ✅ [{task_id}] Image generated successfully.")
                # Check safety feedback even on success
                safety_ratings = getattr(response.candidates[0], 'safety_ratings', [])
                if safety_ratings:
                    filtered_ratings = [f"{r.category.name}: {r.probability.name}" for r in safety_ratings if r.probability.name != 'NEGLIGIBLE']
                    if filtered_ratings:
                        logger.warning(f"   ⚠️ [{task_id}] Image generated but flagged by safety filters: {', '.join(filtered_ratings)}.")
                        st.warning(f"Image for scene {task_id} flagged by safety filters: {', '.join(filtered_ratings)}", icon="⚠️")

                return image
            except Exception as img_err:
                logger.error(f"   ❌ [{task_id}] Failed to decode generated image data: {img_err}")
                st.warning(f"Failed to decode image data for scene {task_id}.", icon="🖼️")
                return None

        if saw_file_uri:
            # A file reference was returned but no inline bytes; downloading it is not implemented.
            logger.warning(f"   ⚠️ [{task_id}] Received file URI instead of inline data. Handling not implemented.")
            return None

        # No image at all: report the block reason when the API supplied one
        block_reason = None
        prompt_feedback = getattr(response, 'prompt_feedback', None)
        if prompt_feedback:
            block_reason = getattr(prompt_feedback, 'block_reason', None)

        if block_reason:
            logger.warning(f"   ⚠️ [{task_id}] Image generation blocked. Reason: {block_reason}. Prompt: '{prompt[:70]}...'")
            st.warning(f"Image generation blocked for scene {task_id}. Reason: {block_reason}", icon="🚫")
        else:
            logger.warning(f"   ⚠️ [{task_id}] No image data received, unknown reason. Prompt: '{prompt[:70]}...'")
            st.warning(f"No image data received for scene {task_id}, reason unclear.", icon="🖼️")
        return None

    except genai.types.generation_types.BlockedPromptException as bpe:
        # This might be caught by the block_reason check above, but good to have explicit catch
        logger.error(f"   ❌ [{task_id}] Image generation blocked (exception): {bpe}")
        st.error(f"Image generation blocked for scene {task_id} due to safety settings.", icon="🚫")
        return None
    except Exception as e:
        logger.exception(f"   ❌ [{task_id}] Image generation failed unexpectedly for '{prompt[:70]}...': {e}")
        st.error(f"Image generation failed for scene {task_id}: {e}", icon="🖼️")
        return None


# --- Streamlit UI Elements ---
st.sidebar.header("⚙️ Configuration")

# Report whether the Google API key was found
if not GOOGLE_API_KEY:
    st.sidebar.error("Google API Key Missing!", icon="🚨") # Should not be reached if st.stop() works
else:
    st.sidebar.success("Google API Key Loaded", icon="✅")

# Story inputs: theme, size of the story grid, and an optional divergence hint
theme = st.sidebar.text_input(
    "📖 Story Theme:",
    value="A curious squirrel finds a mysterious, glowing acorn",
)
num_scenes = st.sidebar.slider(
    "🎬 Scenes per Timeline:",
    min_value=2,
    max_value=7,
    value=3,
    help="Number of scenes (image+narration) in each timeline.",
)
num_timelines = st.sidebar.slider(
    "🌿 Number of Timelines:",
    min_value=1,
    max_value=4,
    value=2,
    help="Number of parallel storylines to generate.",
)
divergence_prompt = st.sidebar.text_input(
    "↔️ Divergence Hint (Optional):",
    placeholder="e.g., What if a bird tried to steal it?",
    help="A suggestion for how the timelines might differ.",
)

# Rendering options for the generated media
st.sidebar.subheader("🎨 Visual & Audio Settings")
aspect_ratio = st.sidebar.selectbox(
    "🖼️ Image Aspect Ratio:",
    options=["1:1", "16:9", "9:16"],
    index=0,
    help="Aspect ratio for generated images.",
)
# Voice selection is not wired up yet; a selectbox could be added here once the
# audio API exposes a known list of voices, e.g.:
# available_voices = ["aura-asteria-en", "aura-luna-en", "aura-stella-en"]
# audio_voice = st.sidebar.selectbox("🗣️ Narration Voice:", available_voices, index=0)
audio_voice = None # Placeholder

# The trigger button is disabled while no API key is available
generate_button = st.sidebar.button(
    "✨ Generate ChronoWeave ✨",
    type="primary",
    disabled=not GOOGLE_API_KEY,
    use_container_width=True,
)

st.sidebar.markdown("---")
st.sidebar.info(
    "⏳ Generation can take several minutes, especially with more scenes or timelines.",
    icon="⏳",
)
st.sidebar.markdown(
    f"<small>Models: Text={TEXT_MODEL_ID}, Image={IMAGE_MODEL_ID}, Audio={AUDIO_MODEL_ID}</small>",
    unsafe_allow_html=True,
)


# --- Main Logic ---
def _close_clips_quietly(clips, label):
    """Close every moviepy clip in *clips* (and its audio), logging instead of raising.

    Args:
        clips: List of clip objects exposing ``audio`` and ``close()``.
        label: Timeline label used as a prefix in the log lines.
    """
    logger.debug(f"[{label}] Closing {len(clips)} source clips...")
    for i, clip in enumerate(clips):
        try:
            if clip: # Check if clip object exists
                if clip.audio: clip.audio.close()
                clip.close()
        except Exception as e_close:
            logger.warning(f"   ⚠️ [{label}] Error closing source clip {i}: {e_close}")


# Driver: on button press, generate the story structure, then for each timeline
# build image + audio + clip per scene, assemble one video, show results, clean up.
if generate_button:
    # Reject empty and whitespace-only themes alike
    if not theme or not theme.strip():
        st.error("Please enter a story theme in the sidebar.", icon="👈")
    else:
        # Create a unique temporary directory for this run
        run_id = str(uuid.uuid4()).split('-')[0] # Short unique ID
        temp_dir = os.path.join(TEMP_DIR_BASE, f"run_{run_id}")
        try:
            os.makedirs(temp_dir, exist_ok=True)
            logger.info(f"Created temporary directory: {temp_dir}")
        except OSError as e:
            st.error(f"🚨 Failed to create temporary directory {temp_dir}: {e}", icon="📂")
            st.stop()

        final_video_paths = {} # Stores {timeline_id: video_path}
        generation_errors = {} # Stores {timeline_id: [error_messages]}

        # --- 1. Generate Narrative Structure ---
        chrono_response: Optional[ChronoWeaveResponse] = None
        with st.spinner("Generating narrative structure... 🤔"):
            chrono_response = generate_story_sequence_chrono(theme, num_scenes, num_timelines, divergence_prompt)

        if chrono_response:
            st.success(f"Narrative structure received for {len(chrono_response.timelines)} timelines.")
            logger.info(f"Successfully generated structure for {len(chrono_response.timelines)} timelines.")

            # --- 2. Process Each Timeline ---
            overall_start_time = time.time()
            all_timelines_successful = True # Assume success initially

            # Use st.status for collapsible progress updates
            with st.status("Generating assets and composing videos...", expanded=True) as status:

                for timeline_index, timeline in enumerate(chrono_response.timelines):
                    timeline_id = timeline.timeline_id
                    divergence = timeline.divergence_reason
                    segments = timeline.segments
                    timeline_label = f"Timeline {timeline_id}" # Consistent label
                    st.subheader(f"Processing {timeline_label}: {divergence}")
                    logger.info(f"--- Processing {timeline_label} (Index: {timeline_index}) ---")
                    generation_errors[timeline_id] = [] # Initialize error list

                    temp_image_files = {} # {scene_id: path}
                    temp_audio_files = {} # {scene_id: path}
                    video_clips = [] # List of moviepy clips
                    timeline_start_time = time.time()
                    scene_success_count = 0

                    for scene_index, segment in enumerate(segments):
                        scene_id = segment.scene_id
                        task_id = f"T{timeline_id}_S{scene_id}" # Unique ID
                        status_message = f"Processing {timeline_label}, Scene {scene_id + 1}/{len(segments)}..."
                        status.update(label=status_message)
                        st.markdown(f"--- **Scene {scene_id + 1} ({task_id})** ---")
                        logger.info(status_message)

                        scene_has_error = False

                        # Log scene details
                        st.write(f"   *Image Prompt:* {segment.image_prompt}" + (f" *(Modifier: {segment.timeline_visual_modifier})*" if segment.timeline_visual_modifier else ""))
                        st.write(f"   *Audio Text:* {segment.audio_text}")

                        # --- 2a. Image Generation ---
                        generated_image: Optional[Image.Image] = None # Define before spinner
                        with st.spinner(f"[{task_id}] Generating image... 🎨"):
                            combined_prompt = f"{segment.image_prompt}. {segment.character_description}"
                            if segment.timeline_visual_modifier:
                                combined_prompt += f" Visual style hint: {segment.timeline_visual_modifier}."
                            generated_image = generate_image_imagen(combined_prompt, aspect_ratio, task_id)

                        if generated_image:
                            image_path = os.path.join(temp_dir, f"{task_id}_image.png")
                            try:
                                generated_image.save(image_path)
                                temp_image_files[scene_id] = image_path
                                st.image(generated_image, width=180, caption=f"Scene {scene_id+1} Image")
                            except Exception as e:
                                logger.error(f"   ❌ [{task_id}] Failed to save image {image_path}: {e}")
                                st.error(f"Failed to save image for scene {task_id}.", icon="💾")
                                scene_has_error = True
                                generation_errors[timeline_id].append(f"Scene {scene_id+1}: Image save failed.")
                        else:
                            st.warning(f"Image generation failed for scene {task_id}. Skipping scene.", icon="🖼️")
                            scene_has_error = True
                            generation_errors[timeline_id].append(f"Scene {scene_id+1}: Image generation failed.")
                            continue # Skip audio/video for this scene

                        # --- 2b. Audio Generation ---
                        generated_audio_path: Optional[str] = None
                        if not scene_has_error:
                            with st.spinner(f"[{task_id}] Generating audio... 🔊"):
                                audio_path_temp = os.path.join(temp_dir, f"{task_id}_audio.wav")
                                try:
                                    # Run the async function using asyncio.run()
                                    generated_audio_path = asyncio.run(
                                        generate_audio_live_async(segment.audio_text, audio_path_temp, audio_voice)
                                    )
                                except RuntimeError as e:
                                    logger.error(f"   ❌ [{task_id}] Asyncio runtime error during audio gen: {e}")
                                    st.error(f"Asyncio error during audio generation for {task_id}: {e}", icon="⚡")
                                    scene_has_error = True
                                    generation_errors[timeline_id].append(f"Scene {scene_id+1}: Audio async error.")
                                except Exception as e:
                                    logger.exception(f"   ❌ [{task_id}] Unexpected error during audio generation call for {task_id}: {e}")
                                    st.error(f"Unexpected error in audio generation for {task_id}: {e}", icon="💥")
                                    scene_has_error = True
                                    generation_errors[timeline_id].append(f"Scene {scene_id+1}: Audio generation error.")

                            if generated_audio_path:
                                temp_audio_files[scene_id] = generated_audio_path
                                try:
                                    with open(generated_audio_path, 'rb') as ap:
                                        st.audio(ap.read(), format='audio/wav')
                                except Exception as e:
                                    logger.warning(f"   ⚠️ [{task_id}] Could not display audio preview: {e}")
                            else:
                                st.warning(f"Audio generation failed for {task_id}. Skipping video clip.", icon="🔊")
                                # If an exception handler above already recorded this failure,
                                # do not add a second entry for the same scene.
                                if not scene_has_error:
                                    generation_errors[timeline_id].append(f"Scene {scene_id+1}: Audio generation failed.")
                                scene_has_error = True
                                # Clean up image if audio fails
                                if scene_id in temp_image_files and os.path.exists(temp_image_files[scene_id]):
                                    try:
                                        os.remove(temp_image_files[scene_id])
                                        logger.info(f"   🗑️ [{task_id}] Removed image file due to audio failure.")
                                        del temp_image_files[scene_id]
                                    except OSError as e:
                                        logger.warning(f"   ⚠️ [{task_id}] Could not remove image file {temp_image_files[scene_id]} after audio failure: {e}")
                                continue # Skip video clip creation

                        # --- 2c. Create Video Clip ---
                        if not scene_has_error and scene_id in temp_image_files and scene_id in temp_audio_files:
                            st.write(f"   🎬 Creating video clip for Scene {scene_id+1}...")
                            img_path = temp_image_files[scene_id]
                            aud_path = temp_audio_files[scene_id]
                            audio_clip_instance = None # Define before try
                            image_clip_instance = None # Define before try
                            composite_clip = None # Define before try
                            try:
                                if not os.path.exists(img_path): raise FileNotFoundError(f"Image file not found: {img_path}")
                                if not os.path.exists(aud_path): raise FileNotFoundError(f"Audio file not found: {aud_path}")

                                audio_clip_instance = AudioFileClip(aud_path)
                                # Copy the pixels into an array and release the file handle right away
                                with Image.open(img_path) as scene_image:
                                    np_image = np.array(scene_image)
                                image_clip_instance = ImageClip(np_image).set_duration(audio_clip_instance.duration)

                                composite_clip = image_clip_instance.set_audio(audio_clip_instance)
                                video_clips.append(composite_clip) # Add the clip to be concatenated later
                                logger.info(f"      ✅ [{task_id}] Video clip created (Duration: {audio_clip_instance.duration:.2f}s).")
                                st.write(f"      ✅ Clip created (Duration: {audio_clip_instance.duration:.2f}s).")
                                scene_success_count += 1
                                # Don't close individual clips here yet, needed for concatenation

                            except Exception as e:
                                logger.exception(f"      ❌ [{task_id}] Failed to create video clip for scene {scene_id+1}: {e}")
                                st.error(f"Failed to create video clip for {task_id}: {e}", icon="🎬")
                                scene_has_error = True
                                generation_errors[timeline_id].append(f"Scene {scene_id+1}: Video clip creation failed.")
                                # Cleanup resources if clip creation failed for *this* scene
                                if audio_clip_instance: audio_clip_instance.close()
                                if image_clip_instance: image_clip_instance.close()
                                # Attempt cleanup of related files; a failed delete must not abort the run
                                for stale_path in (img_path, aud_path):
                                    try:
                                        if os.path.exists(stale_path): os.remove(stale_path)
                                    except OSError as rm_err:
                                        logger.warning(f"   ⚠️ [{task_id}] Could not remove {stale_path}: {rm_err}")

                        # --- End of Scene Loop ---

                    # --- 2d. Assemble Timeline Video ---
                    # Only assemble if clips were created and every scene of the timeline succeeded
                    if video_clips and scene_success_count == len(segments):
                        status.update(label=f"Composing final video for {timeline_label}...")
                        st.write(f"🎞️ Assembling final video for {timeline_label}...")
                        logger.info(f"🎞️ Assembling final video for {timeline_label} ({len(video_clips)} clips)...")
                        output_filename = os.path.join(temp_dir, f"timeline_{timeline_id}_final.mp4")
                        final_timeline_video = None # Define before try block
                        try:
                            # Concatenate the collected clips
                            final_timeline_video = concatenate_videoclips(video_clips, method="compose")
                            final_timeline_video.write_videofile(
                                output_filename,
                                fps=VIDEO_FPS,
                                codec=VIDEO_CODEC,
                                audio_codec=AUDIO_CODEC,
                                logger=None # Suppress moviepy console spam
                            )
                            final_video_paths[timeline_id] = output_filename
                            # Measured after encoding so the reported time includes assembly
                            timeline_duration = time.time() - timeline_start_time
                            logger.info(f"   ✅ [{timeline_label}] Final video saved: {os.path.basename(output_filename)}")
                            st.success(f"✅ Video for {timeline_label} completed in {timeline_duration:.2f}s.")

                        except Exception as e:
                            logger.exception(f"   ❌ [{timeline_label}] Failed to write final video: {e}")
                            st.error(f"Failed to assemble video for {timeline_label}: {e}", icon="📼")
                            all_timelines_successful = False
                            generation_errors[timeline_id].append(f"Timeline {timeline_id}: Final video assembly failed.")
                        finally:
                            # Now close all individual clips and the final concatenated clip
                            _close_clips_quietly(video_clips, timeline_label)
                            if final_timeline_video:
                                try:
                                    if final_timeline_video.audio: final_timeline_video.audio.close()
                                    final_timeline_video.close()
                                    logger.debug(f"[{timeline_label}] Closed final video object.")
                                except Exception as e_close_final:
                                    logger.warning(f"   ⚠️ [{timeline_label}] Error closing final video object: {e_close_final}")

                    elif not video_clips:
                        logger.warning(f"[{timeline_label}] No video clips successfully generated. Skipping final assembly.")
                        st.warning(f"No scenes were successfully processed for {timeline_label}. Video cannot be created.", icon="🚫")
                        all_timelines_successful = False
                    else: # Some scenes failed, so scene_success_count < len(segments)
                        error_count = len(segments) - scene_success_count
                        logger.warning(f"[{timeline_label}] Encountered errors in {error_count} scene(s). Skipping final video assembly.")
                        st.warning(f"{timeline_label} had errors in {error_count} scene(s). Final video not assembled.", icon="⚠️")
                        all_timelines_successful = False
                        # The clips that did get built are never concatenated; release them here
                        _close_clips_quietly(video_clips, timeline_label)

                    # Log accumulated errors for the timeline if any occurred
                    if generation_errors[timeline_id]:
                        logger.error(f"Summary of errors in {timeline_label}: {generation_errors[timeline_id]}")

                # --- End of Timelines Loop ---

                # Final status update
                overall_duration = time.time() - overall_start_time
                if all_timelines_successful and final_video_paths:
                    status_msg = f"ChronoWeave Generation Complete! ({len(final_video_paths)} videos in {overall_duration:.2f}s)"
                    status.update(label=status_msg, state="complete", expanded=False)
                    logger.info(status_msg)
                elif final_video_paths: # Some videos made, but errors occurred
                    status_msg = f"ChronoWeave Partially Complete ({len(final_video_paths)} videos, some errors occurred). Total time: {overall_duration:.2f}s"
                    # st.status only accepts "running", "complete" or "error"; flag partial runs as "error"
                    status.update(label=status_msg, state="error", expanded=True)
                    logger.warning(status_msg)
                else: # No videos made
                    status_msg = f"ChronoWeave Generation Failed. No videos produced. Total time: {overall_duration:.2f}s"
                    status.update(label=status_msg, state="error", expanded=True)
                    logger.error(status_msg)

            # --- 3. Display Results ---
            st.header("🎬 Generated Timelines")
            if final_video_paths:
                sorted_timeline_ids = sorted(final_video_paths.keys())
                # At most three columns; further videos wrap around into the same columns
                num_cols = min(len(sorted_timeline_ids), 3)
                cols = st.columns(num_cols)

                for idx, timeline_id in enumerate(sorted_timeline_ids):
                    col = cols[idx % num_cols] # Cycle through columns
                    video_path = final_video_paths[timeline_id]
                    timeline_data = next((t for t in chrono_response.timelines if t.timeline_id == timeline_id), None)
                    reason = timeline_data.divergence_reason if timeline_data else "Unknown Divergence"

                    with col:
                        st.subheader(f"Timeline {timeline_id}")
                        st.caption(f"Divergence: {reason}")
                        try:
                            # Read the bytes now: the temp directory is deleted at the end of this run
                            with open(video_path, 'rb') as video_file:
                                video_bytes = video_file.read()
                            st.video(video_bytes)
                            logger.info(f"Displaying video for Timeline {timeline_id}")
                            st.download_button(
                                label=f"Download T{timeline_id} Video",
                                data=video_bytes,
                                file_name=f"chronoweave_timeline_{timeline_id}.mp4",
                                mime="video/mp4",
                                key=f"download_btn_{timeline_id}" # Unique key for download button
                            )
                            # Display errors for this timeline if any occurred
                            if generation_errors.get(timeline_id):
                                with st.expander(f"⚠️ View {len(generation_errors[timeline_id])} Generation Issues"):
                                    for error_msg in generation_errors[timeline_id]:
                                        st.warning(f"- {error_msg}")

                        except FileNotFoundError:
                            logger.error(f"Could not find video file for display: {video_path}")
                            st.error(f"Error: Video file not found for Timeline {timeline_id}.", icon="🚨")
                        except Exception as e:
                            logger.exception(f"Could not display video {video_path}: {e}")
                            st.error(f"Error displaying video for Timeline {timeline_id}: {e}", icon="🚨")
            else:
                st.warning("No final videos were successfully generated in this run.")
                # Display summary of all errors if no videos were made
                all_errors = [msg for err_list in generation_errors.values() for msg in err_list]
                if all_errors:
                    st.subheader("Summary of Generation Issues")
                    with st.expander("View All Errors", expanded=True):
                        for tid, errors in generation_errors.items():
                            if errors:
                                st.error(f"Timeline {tid}:")
                                for msg in errors:
                                    st.error(f"  - {msg}")

            # --- 4. Cleanup ---
            st.info(f"Attempting to clean up temporary directory: {temp_dir}")
            try:
                shutil.rmtree(temp_dir)
                logger.info(f"✅ Temporary directory removed: {temp_dir}")
                st.success("✅ Temporary files cleaned up.")
            except Exception as e:
                logger.error(f"⚠️ Could not remove temporary directory {temp_dir}: {e}")
                st.warning(f"Could not automatically remove temporary files: {temp_dir}. Please remove it manually if needed.", icon="⚠️")

        else:
            # Error message likely already shown by generate_story_sequence_chrono
            logger.error("Story generation failed, cannot proceed.")
            # The run directory was created above; remove it so failed runs do not pile up
            shutil.rmtree(temp_dir, ignore_errors=True)

else:
    st.info("Configure settings in the sidebar and click '✨ Generate ChronoWeave ✨' to start.")