Spaces:

mgbam
/

StoryVerseWeaver

Sleeping

App Files Community

mgbam committed on May 17

Commit

1c5c923

verified ·

1 Parent(s): fe60278

Update app.py

Browse files

Files changed (1) hide show

app.py +204 -160

app.py CHANGED Viewed

@@ -2,59 +2,102 @@
 import gradio as gr
 import os
 import time
-from PIL import Image
 # --- Core Logic Imports ---
 from core.llm_services import initialize_text_llms, is_gemini_text_ready, is_hf_text_ready, generate_text_gemini, generate_text_hf
-from core.image_services import initialize_image_llms, STABILITY_API_CONFIGURED, OPENAI_DALLE_CONFIGURED, generate_image_stabilityai, generate_image_dalle # Add other providers if implemented
-from core.story_engine import Story, Scene # Manages the story
 from prompts.narrative_prompts import get_narrative_system_prompt, format_narrative_user_prompt
 from prompts.image_style_prompts import STYLE_PRESETS, COMMON_NEGATIVE_PROMPTS, format_image_generation_prompt
 from core.utils import basic_text_cleanup
-# --- Initialize Services ---
 initialize_text_llms()
 initialize_image_llms()
-# --- Available Model Configuration (Simplified for StoryVerse) ---
-# Text Models
 TEXT_MODELS = {}
-if is_gemini_text_ready():
-    TEXT_MODELS["Gemini 1.5 Flash (Text)"] = {"id": "gemini-1.5-flash-latest", "type": "gemini"}
-    TEXT_MODELS["Gemini 1.0 Pro (Text)"] = {"id": "gemini-1.0-pro-latest", "type": "gemini"}
-if is_hf_text_ready():
     TEXT_MODELS["Mistral 7B (HF Text)"] = {"id": "mistralai/Mistral-7B-Instruct-v0.2", "type": "hf_text"}
-DEFAULT_TEXT_MODEL_KEY = list(TEXT_MODELS.keys())[0] if TEXT_MODELS else "No Text Models Available"
-# Image Models (Providers)
 IMAGE_PROVIDERS = {}
-if STABILITY_API_CONFIGURED: IMAGE_PROVIDERS["Stability AI (Stable Diffusion XL)"] = "stability_ai"
-if OPENAI_DALLE_CONFIGURED: IMAGE_PROVIDERS["OpenAI DALL-E 3 (Simulated)"] = "dalle"
-# Add other HF image models if you implement image_services.generate_image_hf_model
-DEFAULT_IMAGE_PROVIDER_KEY = list(IMAGE_PROVIDERS.keys())[0] if IMAGE_PROVIDERS else "No Image Providers Available"
 # --- Gradio UI Theme and CSS ---
 story_theme = gr.themes.Soft(
     primary_hue=gr.themes.colors.purple,
     secondary_hue=gr.themes.colors.pink,
     font=[gr.themes.GoogleFont("Quicksand"), "ui-sans-serif", "system-ui", "sans-serif"]
 )
 custom_css = """
-.gradio-container { max-width: 1200px !important; margin: auto !important; }
-.panel_image img { object-fit: contain; width: 100%; height: 100%; max-height: 512px; }
-.gallery_output .thumbnail-item { height: 150px !important; width: 150px !important; }
 .gallery_output .thumbnail-item img { height: 100% !important; width: 100% !important; object-fit: cover !important; }
-.status_text { font-weight: bold; padding: 8px; text-align: center; border-radius: 5px; margin-top:10px;}
-.error_text { background-color: #ffebee; color: #c62828; }
-.success_text { background-color: #e8f5e9; color: #2e7d32; }
-.processing_text { background-color: #e3f2fd; color: #1565c0; }
-.compact-row .gr-form {gap: 8px !important;} /* Reduce gap in rows */
 """
 # --- StoryVerse Weaver Orchestrator ---
 def add_scene_to_story(
-    current_story_obj: Story, # Comes from gr.State
     scene_prompt_text: str,
     image_style_dropdown: str,
     artist_style_text: str,
@@ -64,183 +107,178 @@ def add_scene_to_story(
     progress=gr.Progress(track_tqdm=True)
 ):
     if not scene_prompt_text.strip():
-        return current_story_obj, None, "<p class='error_text status_text'>Scene prompt cannot be empty!</p>"
     progress(0, desc="Initializing new scene...")
-    log_updates = ["Starting new scene generation..."]
     # --- 1. Generate Narrative Text ---
-    progress(0.2, desc="Generating narrative...")
-    narrative_text_generated = "Narrative generation failed."
     text_model_info = TEXT_MODELS.get(text_model_key)
-    if text_model_info:
-        system_p = get_narrative_system_prompt("default") # or "comic"
-        # Could use last scene's narrative for context if desired
-        # prev_narrative = current_story_obj.get_last_scene_narrative()
-        user_p = format_narrative_user_prompt(scene_prompt_text) #, prev_narrative)
         text_response = None
         if text_model_info["type"] == "gemini":
-            text_response = generate_text_gemini(user_p, model_id=text_model_info["id"], system_prompt=system_p, max_tokens=300)
         elif text_model_info["type"] == "hf_text":
-            text_response = generate_text_hf(user_p, model_id=text_model_info["id"], system_prompt=system_p, max_tokens=300)
         if text_response and text_response.success:
             narrative_text_generated = basic_text_cleanup(text_response.text)
-            log_updates.append(f"Narrative generated using {text_model_key}.")
         elif text_response:
-            narrative_text_generated = f"Narrative Error: {text_response.error}"
-            log_updates.append(f"Narrative generation FAILED with {text_model_key}: {text_response.error}")
         else:
-             log_updates.append(f"Narrative generation FAILED with {text_model_key}: No response object.")
     else:
-        narrative_text_generated = "Selected text model not available."
-        log_updates.append("Narrative generation FAILED: Text model not found.")
     # --- 2. Generate Image ---
-    progress(0.6, desc="Generating image...")
-    image_generated = None
-    image_error = None
-    selected_image_provider = IMAGE_PROVIDERS.get(image_provider_key)
-    # Use the generated narrative (or original prompt if narrative failed) for image prompt
-    image_content_prompt = narrative_text_generated if narrative_text_generated and "Error" not in narrative_text_generated else scene_prompt_text
-    full_image_prompt = format_image_generation_prompt(image_content_prompt[:300], image_style_dropdown, artist_style_text) # Limit prompt length for image gen
-    if selected_image_provider:
-        image_response = None
-        if selected_image_provider == "stability_ai":
-            image_response = generate_image_stabilityai(full_image_prompt, style_preset=None, negative_prompt=negative_prompt_text or COMMON_NEGATIVE_PROMPTS)
-        elif selected_image_provider == "dalle":
-            image_response = generate_image_dalle(full_image_prompt) # Uses default DALL-E settings from image_services
         # Add elif for HF image models if implemented
         if image_response and image_response.success:
-            image_generated = image_response.image
-            log_updates.append(f"Image generated using {image_provider_key}.")
         elif image_response:
-            image_error = f"Image Error ({image_provider_key}): {image_response.error}"
-            log_updates.append(f"Image generation FAILED with {image_provider_key}: {image_response.error}")
         else:
-            image_error = f"Image generation failed: No response from {image_provider_key} service."
-            log_updates.append(f"Image generation FAILED with {image_provider_key}: No response object.")
     else:
-        image_error = "Selected image provider not available."
-        log_updates.append("Image generation FAILED: Image provider not found.")
     # --- 3. Add Scene to Story Object ---
-    if image_error and "Error" in narrative_text_generated: # Both failed
-        current_story_obj.add_scene_with_error(scene_prompt_text, f"Narrative: {narrative_text_generated}. Image: {image_error}")
-    else:
-        current_story_obj.add_scene_from_elements(
-            user_prompt=scene_prompt_text,
-            narrative_text=narrative_text_generated,
-            image=image_generated,
-            image_style_prompt=f"{image_style_dropdown}{f', by {artist_style_text}' if artist_style_text else ''}",
-            image_provider=image_provider_key
-        )
     progress(1.0, desc="Scene complete!")
     # --- 4. Prepare Outputs for Gradio ---
-    # Gallery expects list of (image_path_or_PIL, caption_string) tuples
-    gallery_items = []
-    for scene in current_story_obj.scenes:
-        caption = f"S{scene.scene_number}: {scene.user_prompt[:40]}..."
-        if scene.error_message:
-            # Create a placeholder image for errors or display error text
-            error_img = Image.new('RGB', (100,100), color='red') # Simple red square
-            gallery_items.append((error_img, f"{caption}\nError: {scene.error_message[:100]}..."))
-        else:
-            gallery_items.append((scene.image if scene.image else Image.new('RGB', (100,100), color='grey'), caption)) # Grey if no image but no error
-    # Display the latest scene's full details
-    latest_scene_display = ""
-    if current_story_obj.scenes:
-        ls = current_story_obj.scenes[-1]
-        latest_scene_display = f"## Scene {ls.scene_number}: {ls.user_prompt}\n\n"
-        if ls.error_message:
-            latest_scene_display += f"**Error:** {ls.error_message}\n"
-        else:
-            if ls.image:
-                # Gradio Markdown can't directly display PIL.Image. We'll show it in the gallery.
-                # For single image display, use gr.Image component.
-                latest_scene_display += f"**Style:** {ls.image_style_prompt}\n\n"
-            latest_scene_display += f"{ls.narrative_text}"
-    # Determine status message
     status_message_html = ""
-    if image_error or "Error" in narrative_text_generated:
-        status_message_html = f"<p class='error_text status_text'>Scene added with errors. Narrative: {'OK' if 'Error' not in narrative_text_generated else 'Failed'}. Image: {'OK' if not image_error else 'Failed'}.</p>"
     else:
-        status_message_html = "<p class='success_text status_text'>New scene added successfully!</p>"
-    # For the single image display component, show the latest generated image
-    latest_image_output = image_generated if image_generated else None # (or a placeholder if error)
-    return current_story_obj, gallery_items, latest_image_output, latest_scene_display, status_message_html, "\n".join(log_updates)
-def clear_story_state():
     new_story = Story()
-    return new_story, [], None, "Story Cleared. Ready for a new verse!", "<p class='status_text'>Story Cleared</p>", "Log Cleared."
 # --- Gradio UI Definition ---
-with gr.Blocks(theme=story_theme, css=custom_css) as story_weaver_demo:
     story_state = gr.State(Story()) # Manages the story object
-    gr.Markdown("# ✨ StoryVerse Weaver ✨\nCreate multimodal stories with AI-generated narrative and images!")
-    # API Status Check (Conceptual - real app might hide this or make it admin-only)
-    with gr.Accordion("API & Model Status (Developer Info)", open=False):
-        status_text = []
-        if not GEMINI_API_READY and not HF_API_READY and not STABILITY_API_CONFIGURED and not OPENAI_DALLE_CONFIGURED:
-            status_text.append("<p style='color:red;font-weight:bold;'>⚠️ CRITICAL: NO APIs CONFIGURED. App will be non-functional.</p>")
-        else:
-            if GEMINI_API_READY or HF_API_READY: status_text.append("<p style='color:green;'>✅ Text LLM(s) Ready.</p>")
-            else: status_text.append("<p style='color:orange;'>⚠️ No Text LLMs Ready (Check STORYVERSE_GOOGLE_API_KEY/STORYVERSE_HF_TOKEN).</p>")
-            if STABILITY_API_CONFIGURED or OPENAI_DALLE_CONFIGURED: status_text.append("<p style='color:green;'>✅ Image Generation Service(s) Ready.</p>")
-            else: status_text.append("<p style='color:orange;'>⚠️ No Image Generation Services Ready (Check API Keys).</p>")
-        gr.HTML("".join(status_text))
-    with gr.Row():
         # --- CONTROL PANEL (Inputs) ---
-        with gr.Column(scale=1):
-            gr.Markdown("### 🎬 Scene Input")
-            scene_prompt_input = gr.Textbox(lines=5, label="Describe your scene or story beat:", placeholder="e.g., A lone astronaut discovers a glowing alien artifact on a desolate moon.")
             with gr.Accordion("🎨 Visual Style (Optional)", open=True):
-                image_style_input = gr.Dropdown(choices=["Default"] + list(STYLE_PRESETS.keys()), value="Default", label="Image Style Preset")
-                artist_style_input = gr.Textbox(label="Inspired by Artist (Optional):", placeholder="e.g., Van Gogh, Hayao Miyazaki, HR Giger")
-                negative_prompt_input = gr.Textbox(lines=2, label="Negative Prompt (Optional):", placeholder="e.g., blurry, text, watermark, poorly drawn", value=COMMON_NEGATIVE_PROMPTS)
             with gr.Accordion("⚙️ AI Configuration (Advanced)", open=False):
-                text_model_dropdown = gr.Dropdown(choices=list(TEXT_MODELS.keys()), value=DEFAULT_TEXT_MODEL_KEY, label="Text Generation Model")
-                image_provider_dropdown = gr.Dropdown(choices=list(IMAGE_PROVIDERS.keys()), value=DEFAULT_IMAGE_PROVIDER_KEY, label="Image Generation Provider")
-                # Could add sliders for temperature, tokens etc. here later
-            with gr.Row(elem_classes=["compact-row"]):
-                add_scene_button = gr.Button("➕ Weave Next Scene", variant="primary")
-                clear_story_button = gr.Button("🗑️ Clear Story")
-            status_bar_output = gr.HTML(value="<p class='status_text'>Ready to weave...</p>")
         # --- STORY DISPLAY (Outputs) ---
-        with gr.Column(scale=2):
-            gr.Markdown("### 📖 Your StoryVerse So Far")
             with gr.Tabs():
-                with gr.TabItem("🖼️ Latest Scene View"):
-                    latest_scene_image_output = gr.Image(label="Latest Scene Image", type="pil", interactive=False, show_download_button=True, elem_classes=["panel_image"])
-                    latest_scene_narrative_output = gr.Markdown(label="Latest Scene Narrative")
-                with gr.TabItem(" галерея | Story Scroll"): # Gallery in Russian, for fun :)
-                    story_gallery_output = gr.Gallery(label="Story Scroll", show_label=False, columns=[3], object_fit="contain", height="auto", elem_classes=["gallery_output"])
-                with gr.TabItem("📜 Interaction Log"):
                     log_output_markdown = gr.Markdown("Log will appear here...")
     # --- Event Handlers ---
@@ -251,14 +289,14 @@ with gr.Blocks(theme=story_theme, css=custom_css) as story_weaver_demo:
             image_style_input, artist_style_input, negative_prompt_input,
             text_model_dropdown, image_provider_dropdown
         ],
-        outputs=[ # Order must match the return order of add_scene_to_story
             story_state, story_gallery_output,
             latest_scene_image_output, latest_scene_narrative_output,
             status_bar_output, log_output_markdown
         ]
     )
     clear_story_button.click(
-        fn=clear_story_state,
         inputs=[],
         outputs=[
             story_state, story_gallery_output,
@@ -267,33 +305,39 @@ with gr.Blocks(theme=story_theme, css=custom_css) as story_weaver_demo:
         ]
     )
-    # Example Prompts for User
     gr.Examples(
         examples=[
-            ["A knight faces a dragon in a fiery volcano.", "Fantasy Art", "Frank Frazetta", "blurry, low quality"],
-            ["A futuristic detective investigates a crime in a neon-lit alley.", "Cyberpunk", "Syd Mead", "cartoon, painting"],
-            ["Two children discover a hidden portal in an old oak tree.", "Studio Ghibli Inspired", "", "dark, scary"],
-            ["A single red rose blooming in a post-apocalyptic wasteland.", "Photorealistic", "Ansel Adams", "oversaturated, vibrant"],
         ],
         inputs=[scene_prompt_input, image_style_input, artist_style_input, negative_prompt_input],
-        label="✨ Example Scene Ideas & Styles ✨"
     )
 # --- Entry Point ---
 if __name__ == "__main__":
     print("="*80)
     print("✨ StoryVerse Weaver™ - Multimodal Story Creator - Launching... ✨")
-    print(f"  Text LLM Ready (Gemini): {is_gemini_text_ready()}")
-    print(f"  Text LLM Ready (HF): {is_hf_text_ready()}")
-    print(f"  Image Provider Ready (Stability AI): {STABILITY_API_CONFIGURED}")
-    print(f"  Image Provider Ready (DALL-E): {OPENAI_DALLE_CONFIGURED}")
-    if not (is_gemini_text_ready() or is_hf_text_ready()) or not (STABILITY_API_CONFIGURED or OPENAI_DALLE_CONFIGURED):
-        print("  🔴 WARNING: Not all required API services are configured. Functionality will be limited or fail.")
-        print("     Please set: STORYVERSE_GOOGLE_API_KEY (for Gemini text), and/or STORYVERSE_HF_TOKEN (for HF text),")
-        print("     AND STORYVERSE_STABILITY_API_KEY (for Stability AI images) or STORYVERSE_OPENAI_API_KEY (for DALL-E images) in your environment/secrets.")
-    print(f"  Default Text Model: {DEFAULT_TEXT_MODEL_KEY}")
-    print(f"  Default Image Provider: {DEFAULT_IMAGE_PROVIDER_KEY}")
     print(f"  Available Text Models: {list(TEXT_MODELS.keys())}")
     print(f"  Available Image Providers: {list(IMAGE_PROVIDERS.keys())}")
     print("="*80)
     story_weaver_demo.launch(debug=True, server_name="0.0.0.0")

 import gradio as gr
 import os
 import time
+from PIL import Image # Ensure Pillow is in requirements.txt
 # --- Core Logic Imports ---
+# Import initialization functions and status getters/flags
 from core.llm_services import initialize_text_llms, is_gemini_text_ready, is_hf_text_ready, generate_text_gemini, generate_text_hf
+from core.image_services import initialize_image_llms, STABILITY_API_CONFIGURED, OPENAI_DALLE_CONFIGURED, generate_image_stabilityai, generate_image_dalle
+from core.story_engine import Story, Scene # Manages the story object
 from prompts.narrative_prompts import get_narrative_system_prompt, format_narrative_user_prompt
 from prompts.image_style_prompts import STYLE_PRESETS, COMMON_NEGATIVE_PROMPTS, format_image_generation_prompt
 from core.utils import basic_text_cleanup
+# --- Initialize All External Services ONCE at App Startup ---
 initialize_text_llms()
 initialize_image_llms()
+# --- Get API Readiness Status AFTER initialization for use in this module ---
+GEMINI_TEXT_IS_READY = is_gemini_text_ready()
+HF_TEXT_IS_READY = is_hf_text_ready()
+STABILITY_API_IS_READY = STABILITY_API_CONFIGURED # Directly use the flag from image_services
+OPENAI_DALLE_IS_READY = OPENAI_DALLE_CONFIGURED   # Directly use the flag from image_services
+# --- Application Configuration (Models, Defaults) ---
 TEXT_MODELS = {}
+UI_DEFAULT_TEXT_MODEL_KEY = None
+if GEMINI_TEXT_IS_READY:
+    TEXT_MODELS["✨ Gemini 1.5 Flash (Text)"] = {"id": "gemini-1.5-flash-latest", "type": "gemini"}
+    TEXT_MODELS["Legacy Gemini 1.0 Pro (Text)"] = {"id": "gemini-1.0-pro-latest", "type": "gemini"}
+if HF_TEXT_IS_READY:
     TEXT_MODELS["Mistral 7B (HF Text)"] = {"id": "mistralai/Mistral-7B-Instruct-v0.2", "type": "hf_text"}
+    TEXT_MODELS["Gemma 2B (HF Text)"] = {"id": "google/gemma-2b-it", "type": "hf_text"}
+if TEXT_MODELS:
+    if "✨ Gemini 1.5 Flash (Text)" in TEXT_MODELS: UI_DEFAULT_TEXT_MODEL_KEY = "✨ Gemini 1.5 Flash (Text)"
+    elif "Mistral 7B (HF Text)" in TEXT_MODELS: UI_DEFAULT_TEXT_MODEL_KEY = "Mistral 7B (HF Text)"
+    else: UI_DEFAULT_TEXT_MODEL_KEY = list(TEXT_MODELS.keys())[0]
+else:
+    TEXT_MODELS["No Text Models Available"] = {"id": "dummy_text_error", "type": "none"}
+    UI_DEFAULT_TEXT_MODEL_KEY = "No Text Models Available"
 IMAGE_PROVIDERS = {}
+UI_DEFAULT_IMAGE_PROVIDER_KEY = None
+if STABILITY_API_IS_READY:
+    IMAGE_PROVIDERS["🎨 Stability AI (Stable Diffusion XL)"] = "stability_ai"
+if OPENAI_DALLE_IS_READY:
+    IMAGE_PROVIDERS["🖼️ OpenAI DALL-E 3 (Simulated)"] = "dalle"
+# Add other HF image models if you implement image_services.generate_image_hf_model, e.g.:
+# if is_hf_text_ready(): # Re-use HF token if image model uses it
+#     IMAGE_PROVIDERS["🎡 HF Diffusers Model (Simulated)"] = "hf_image_model"
+if IMAGE_PROVIDERS:
+    if "🎨 Stability AI (Stable Diffusion XL)" in IMAGE_PROVIDERS: UI_DEFAULT_IMAGE_PROVIDER_KEY = "🎨 Stability AI (Stable Diffusion XL)"
+    elif "🖼️ OpenAI DALL-E 3 (Simulated)" in IMAGE_PROVIDERS: UI_DEFAULT_IMAGE_PROVIDER_KEY = "🖼️ OpenAI DALL-E 3 (Simulated)"
+    else: UI_DEFAULT_IMAGE_PROVIDER_KEY = list(IMAGE_PROVIDERS.keys())[0]
+else:
+    IMAGE_PROVIDERS["No Image Providers Available"] = "none"
+    UI_DEFAULT_IMAGE_PROVIDER_KEY = "No Image Providers Available"
 # --- Gradio UI Theme and CSS ---
 story_theme = gr.themes.Soft(
     primary_hue=gr.themes.colors.purple,
     secondary_hue=gr.themes.colors.pink,
+    neutral_hue=gr.themes.colors.slate,
     font=[gr.themes.GoogleFont("Quicksand"), "ui-sans-serif", "system-ui", "sans-serif"]
 )
 custom_css = """
+body { font-family: 'Quicksand', sans-serif; background-color: #f0f2f5; }
+.gradio-container { max-width: 1280px !important; margin: auto !important; background-color: #ffffff; border-radius: 15px; box-shadow: 0 8px 24px rgba(0,0,0,0.1); padding: 20px !important;}
+.panel_image img { object-fit: contain; width: 100%; max-height: 512px; border-radius: 8px; box-shadow: 0 4px 12px rgba(0,0,0,0.1); }
+.gallery_output { background-color: #f8f9fa !important; border-radius: 8px; padding: 10px; }
+.gallery_output .thumbnail-item { height: 160px !important; width: 160px !important; border-radius: 6px; overflow: hidden; box-shadow: 0 2px 6px rgba(0,0,0,0.08); margin: 5px !important;}
 .gallery_output .thumbnail-item img { height: 100% !important; width: 100% !important; object-fit: cover !important; }
+.status_text { font-weight: 500; padding: 10px 15px; text-align: center; border-radius: 6px; margin-top:10px; transition: all 0.3s ease;}
+.error_text { background-color: #ffcdd2; color: #b71c1c; border: 1px solid #ef9a9a;} /* Red family */
+.success_text { background-color: #c8e6c9; color: #1b5e20; border: 1px solid #a5d6a7;} /* Green family */
+.processing_text { background-color: #bbdefb; color: #0d47a1; border: 1px solid #90caf9;} /* Blue family */
+.compact-row .gr-form {gap: 8px !important;}
+.gr-button-primary {
+    background: linear-gradient(135deg, #667eea 0%, #764ba2 100%) !important; /* Purple gradient */
+    color: white !important; border: none !important; box-shadow: 0 4px 8px rgba(0,0,0,0.15) !important;
+    font-weight: 600 !important; transition: all 0.2s ease-in-out !important; padding: 10px 20px !important; border-radius: 8px !important;
+}
+.gr-button-primary:hover { transform: translateY(-2px) !important; box-shadow: 0 6px 12px rgba(0,0,0,0.2) !important; }
+.gr-button-secondary { border-radius: 8px !important; }
+.gr-markdown h1, .gr-markdown h2, .gr-markdown h3 { color: #4A00E0; } /* Purple headers */
+.accordion-section .gr-markdown { padding-top: 5px; padding-bottom: 5px; }
+.output-tabs .gr-tabitem {min-height: 450px;}
+.important-note { background-color: #fff3cd; border-left: 5px solid #ffeeba; padding: 10px; margin-bottom:15px; color: #856404; border-radius: 4px;}
 """
 # --- StoryVerse Weaver Orchestrator ---
 def add_scene_to_story(
+    current_story_obj: Story,
     scene_prompt_text: str,
     image_style_dropdown: str,
     artist_style_text: str,
     progress=gr.Progress(track_tqdm=True)
 ):
     if not scene_prompt_text.strip():
+        return current_story_obj, [], None, "## Error\nScene prompt cannot be empty!", "<p class='error_text status_text'>Scene prompt cannot be empty!</p>", "Log: Scene prompt empty."
     progress(0, desc="Initializing new scene...")
+    log_accumulator = [f"**New Scene Generation - {time.strftime('%H:%M:%S')}**"]
+    if not current_story_obj: current_story_obj = Story() # Safety net
     # --- 1. Generate Narrative Text ---
+    progress(0.15, desc="✍️ Generating narrative...")
+    narrative_text_generated = f"Narrative generation failed for '{scene_prompt_text[:30]}...'."
     text_model_info = TEXT_MODELS.get(text_model_key)
+    if text_model_info and text_model_info["type"] != "none":
+        system_p = get_narrative_system_prompt("default")
+        prev_narrative = current_story_obj.get_last_scene_narrative()
+        user_p = format_narrative_user_prompt(scene_prompt_text, prev_narrative)
         text_response = None
+        log_accumulator.append(f"  Narrative: Using {text_model_key} ({text_model_info['id']})")
         if text_model_info["type"] == "gemini":
+            text_response = generate_text_gemini(user_p, model_id=text_model_info["id"], system_prompt=system_p, max_tokens=350)
         elif text_model_info["type"] == "hf_text":
+            text_response = generate_text_hf(user_p, model_id=text_model_info["id"], system_prompt=system_p, max_tokens=350)
         if text_response and text_response.success:
             narrative_text_generated = basic_text_cleanup(text_response.text)
+            log_accumulator.append(f"  Narrative: Success. (Snippet: {narrative_text_generated[:50]}...)")
         elif text_response:
+            narrative_text_generated = f"**Narrative Error ({text_model_key}):** {text_response.error}"
+            log_accumulator.append(f"  Narrative: FAILED - {text_response.error}")
         else:
+             log_accumulator.append(f"  Narrative: FAILED - No response object from {text_model_key}.")
     else:
+        narrative_text_generated = "**Narrative Error:** Selected text model not available or misconfigured."
+        log_accumulator.append(f"  Narrative: FAILED - Model '{text_model_key}' not available.")
     # --- 2. Generate Image ---
+    progress(0.55, desc="🎨 Generating image...")
+    image_generated_pil = None
+    image_generation_error_message = None
+    selected_image_provider_type = IMAGE_PROVIDERS.get(image_provider_key)
+    image_content_prompt_for_gen = narrative_text_generated if narrative_text_generated and "Error" not in narrative_text_generated else scene_prompt_text
+    full_image_prompt = format_image_generation_prompt(image_content_prompt_for_gen[:350], image_style_dropdown, artist_style_text) # Limit length
+    log_accumulator.append(f"  Image: Using {image_provider_key}. Style: {image_style_dropdown}. Artist: {artist_style_text or 'N/A'}.")
+    log_accumulator.append(f"  Image Prompt (Base): {image_content_prompt_for_gen[:70]}...")
+    if selected_image_provider_type and selected_image_provider_type != "none":
+        image_response = None # type: ImageGenResponse
+        if selected_image_provider_type == "stability_ai":
+            image_response = generate_image_stabilityai(full_image_prompt, negative_prompt=negative_prompt_text or COMMON_NEGATIVE_PROMPTS)
+        elif selected_image_provider_type == "dalle":
+            image_response = generate_image_dalle(full_image_prompt)
         # Add elif for HF image models if implemented
         if image_response and image_response.success:
+            image_generated_pil = image_response.image
+            log_accumulator.append(f"  Image: Success from {image_response.provider}.")
         elif image_response:
+            image_generation_error_message = f"**Image Error ({image_response.provider}):** {image_response.error}"
+            log_accumulator.append(f"  Image: FAILED - {image_response.error}")
         else:
+            image_generation_error_message = f"**Image Error:** No response object from {image_provider_key} service."
+            log_accumulator.append(f"  Image: FAILED - No response object from {image_provider_key}.")
     else:
+        image_generation_error_message = "**Image Error:** Selected image provider not available or misconfigured."
+        log_accumulator.append(f"  Image: FAILED - Provider '{image_provider_key}' not available.")
     # --- 3. Add Scene to Story Object ---
+    final_scene_error = None
+    if image_generation_error_message and "**Narrative Error**" in narrative_text_generated :
+        final_scene_error = f"{narrative_text_generated}\n{image_generation_error_message}"
+    elif "**Narrative Error**" in narrative_text_generated:
+        final_scene_error = narrative_text_generated
+    elif image_generation_error_message:
+        final_scene_error = image_generation_error_message
+        # Keep generated narrative even if image fails
+    current_story_obj.add_scene_from_elements(
+        user_prompt=scene_prompt_text,
+        narrative_text=narrative_text_generated if "**Narrative Error**" not in narrative_text_generated else "(Narrative generation failed, see error above/below)",
+        image=image_generated_pil,
+        image_style_prompt=f"{image_style_dropdown}{f', by {artist_style_text}' if artist_style_text and artist_style_text.strip() else ''}",
+        image_provider=image_provider_key if selected_image_provider_type != "none" else "N/A",
+        error_message=final_scene_error
+    )
     progress(1.0, desc="Scene complete!")
     # --- 4. Prepare Outputs for Gradio ---
+    gallery_items_tuples = current_story_obj.get_all_scenes_for_gallery_display()
+    latest_img_for_display, latest_narr_for_display = current_story_obj.get_latest_scene_details_for_display()
     status_message_html = ""
+    if final_scene_error:
+        status_message_html = f"<p class='error_text status_text'>Scene added with errors. Check details.</p>"
     else:
+        status_message_html = "<p class='success_text status_text'>✨ New scene woven into your StoryVerse! ✨</p>"
+    return current_story_obj, gallery_items_tuples, latest_img_for_display, latest_narr_for_display, status_message_html, "\n".join(log_accumulator)
+def clear_story_state_ui():
     new_story = Story()
+    # Create a placeholder for the gallery when cleared
+    placeholder_img = Image.new('RGB', (150,150), color='lightgrey')
+    cleared_gallery = [(placeholder_img, "Your StoryVerse is empty. Weave a new scene!")]
+    return new_story, cleared_gallery, None, "## Story Cleared\nReady for a new verse!", "<p class='status_text'>Story Cleared. Let's begin anew!</p>", "Log Cleared."
 # --- Gradio UI Definition ---
+with gr.Blocks(theme=story_theme, css=custom_css, title="✨ StoryVerse Weaver ✨") as story_weaver_demo:
     story_state = gr.State(Story()) # Manages the story object
+    gr.Markdown("# ✨ StoryVerse Weaver ✨\n### Weave Multimodal Stories with AI-Generated Narrative and Images!")
+    gr.HTML("<div class='important-note'>Provide a scene idea and style, then click 'Weave Next Scene'. API keys for text (Gemini or HF) and image generation (Stability AI or DALL-E) must be set in Space Secrets as `STORYVERSE_...` variables.</div>")
+    # API Status (More user-friendly)
+    with gr.Accordion("🔧 AI Services Status", open=False):
+        status_text_list = []
+        text_llm_ok = GEMINI_TEXT_IS_READY or HF_TEXT_IS_READY
+        image_gen_ok = STABILITY_API_IS_READY or OPENAI_DALLE_IS_READY
+        if not text_llm_ok and not image_gen_ok:
+            status_text_list.append("<p style='color:red;font-weight:bold;'>⚠️ CRITICAL: NO AI SERVICES CONFIGURED. App will not function. Please set API keys in Space Secrets.</p>")
+        else:
+            if text_llm_ok: status_text_list.append("<p style='color:green;'>✅ Text Generation Service(s) Ready.</p>")
+            else: status_text_list.append("<p style='color:orange;'>⚠️ Text Generation Service(s) NOT Ready (Check STORYVERSE_GOOGLE_API_KEY / STORYVERSE_HF_TOKEN).</p>")
+            if image_gen_ok: status_text_list.append("<p style='color:green;'>✅ Image Generation Service(s) Ready.</p>")
+            else: status_text_list.append("<p style='color:orange;'>⚠️ Image Generation Service(s) NOT Ready (Check STORYVERSE_STABILITY_API_KEY / STORYVERSE_OPENAI_API_KEY).</p>")
+        gr.HTML("".join(status_text_list))
+    with gr.Row(equal_height=False):
     # Main layout: one row holding two columns, the input controls (scale=2) followed by the
     # story display (scale=3). The component variables created here are the ones referenced by
     # the event handlers and gr.Examples further down.
         # --- CONTROL PANEL (Inputs) ---
+        with gr.Column(scale=2, min_width=380): # Adjusted scale
+            gr.Markdown("### 🎬 **Input Your Scene Idea**")
+            with gr.Group():
                 # Free-text description of the next scene.
+                scene_prompt_input = gr.Textbox(lines=6, label="Scene Description / Story Beat:", placeholder="e.g., A lone astronaut discovers a glowing alien artifact on a desolate, red moon, casting long shadows.")
             with gr.Accordion("🎨 Visual Style (Optional)", open=True):
+                with gr.Group():
                     # Style choices are "Default (Cinematic)" followed by every key of STYLE_PRESETS.
+                    image_style_input = gr.Dropdown(choices=["Default (Cinematic)"] + list(STYLE_PRESETS.keys()), value="Default (Cinematic)", label="Image Style Preset")
+                    artist_style_input = gr.Textbox(label="Artistic Inspiration (Optional):", placeholder="e.g., inspired by Van Gogh, Studio Ghibli, Syd Mead")
                     # The negative prompt is pre-filled with COMMON_NEGATIVE_PROMPTS.
+                    negative_prompt_input = gr.Textbox(lines=2, label="Exclude from Image (Negative Prompt):", placeholder="e.g., blurry, text, watermark, poorly drawn hands", value=COMMON_NEGATIVE_PROMPTS)
             with gr.Accordion("⚙️ AI Configuration (Advanced)", open=False):
+                 with gr.Group():
                     # Choices are the keys of TEXT_MODELS / IMAGE_PROVIDERS; the initial values are
                     # the UI_DEFAULT_* keys, which are defined outside this section.
                     # NOTE(review): confirm the UI_DEFAULT_* values are valid when either dict is empty.
+                    text_model_dropdown = gr.Dropdown(choices=list(TEXT_MODELS.keys()), value=UI_DEFAULT_TEXT_MODEL_KEY, label="Text Generation Model")
+                    image_provider_dropdown = gr.Dropdown(choices=list(IMAGE_PROVIDERS.keys()), value=UI_DEFAULT_IMAGE_PROVIDER_KEY, label="Image Generation Provider")
             # Action buttons share one compact row; the primary button gets twice the width share.
+            with gr.Row(elem_classes=["compact-row"], equal_height=True):
+                add_scene_button = gr.Button("➕ Weave Next Scene", variant="primary", scale=2)
+                clear_story_button = gr.Button("🗑️ New Story", variant="secondary", scale=1)
             # HTML status line, initialised with a "ready" message.
+            status_bar_output = gr.HTML(value="<p class='processing_text status_text'>Ready to weave your first scene!</p>")
         # --- STORY DISPLAY (Outputs) ---
+        with gr.Column(scale=3, min_width=600): # Adjusted scale
+            gr.Markdown("### 📖 **Your StoryVerse Unfolds...**")
             # Three tabs: the latest scene (image + narrative), a gallery of all scenes, and a log.
             with gr.Tabs():
+                with gr.TabItem("🖼️ Latest Scene", elem_id="latest_scene_tab"):
+                    with gr.Row():
+                         latest_scene_image_output = gr.Image(label="Latest Scene Image", type="pil", interactive=False, show_download_button=True, height=400, elem_classes=["panel_image"]) # Fixed height
+                    latest_scene_narrative_output = gr.Markdown(label="Latest Scene Narrative") # Markdown can render images if path is given, but here it's for text
+                with gr.TabItem("📜 Story Scroll (All Scenes)", elem_id="story_scroll_tab"):
+                    story_gallery_output = gr.Gallery(label="Story Scroll", show_label=False, columns=3, object_fit="cover", height=600, preview=True, elem_classes=["gallery_output"]) # Preview on click
+                with gr.TabItem("📝 Interaction Log", elem_id="log_tab"):
                     log_output_markdown = gr.Markdown("Log will appear here...")
     # --- Event Handlers ---
             image_style_input, artist_style_input, negative_prompt_input,
             text_model_dropdown, image_provider_dropdown
         ],
+        outputs=[
             story_state, story_gallery_output,
             latest_scene_image_output, latest_scene_narrative_output,
             status_bar_output, log_output_markdown
         ]
     )
     # "New Story" wiring: clicking the button calls clear_story_state_ui with no component inputs
     # and writes its return values to the components listed in `outputs`.
     # NOTE(review): the outputs list shown here names only story_state and story_gallery_output
     # and may be abridged; confirm it matches what clear_story_state_ui returns.
     clear_story_button.click(
+        fn=clear_story_state_ui, # Use the UI specific clear function
         inputs=[],
         outputs=[
             story_state, story_gallery_output,
         ]
     )
     # Example rows for the input form. Each row lists four values in the same order as `inputs`:
     # scene description, style preset, artistic inspiration, negative prompt.
     # NOTE(review): the second value of every row must be a valid choice of image_style_input,
     # i.e. a key of STYLE_PRESETS (not visible here); verify the names match.
     gr.Examples(
         examples=[
+            ["A knight in shining armor bravely faces a colossal, fire-breathing dragon in front of a crumbling volcano fortress.", "Fantasy Art", "Frank Frazetta", "blurry, low quality, cartoon"],
+            ["In a rain-slicked, neon-drenched cyberpunk alley, a lone detective in a trench coat examines a mysterious datachip.", "Cyberpunk", "Syd Mead", "bright daytime, nature, animals"],
+            ["Two curious children stumble upon a glowing, ancient portal hidden within the roots of a giant, moss-covered oak tree in an enchanted forest.", "Studio Ghibli Inspired", "Hayao Miyazaki", "dark, scary, urban, modern"],
+            ["A single, perfect red rose defiantly blooms amidst the metallic ruins of a desolate, post-apocalyptic cityscape under a grey sky.", "Photorealistic", "Ansel Adams", "oversaturated colors, people, vibrant"],
         ],
         inputs=[scene_prompt_input, image_style_input, artist_style_input, negative_prompt_input],
+        label="✨ Example Scene Ideas & Styles ✨",
         # Only `inputs` is passed; the `outputs` argument below is left disabled.
+        # outputs=[scene_prompt_input, image_style_input, artist_style_input, negative_prompt_input] # To fill inputs
     )
     # Centered grey footer line.
+    gr.HTML("<p style='text-align:center; font-size:0.9em; color:grey; margin-top:20px;'>StoryVerse Weaver™ - Weaving Worlds with Words and Pixels</p>")
 # --- Entry Point ---
 # When run as a script: print a startup banner describing which AI services are ready,
 # warn if either capability has no ready provider, then launch the Gradio app.
 if __name__ == "__main__":
     print("="*80)
     print("✨ StoryVerse Weaver™ - Multimodal Story Creator - Launching... ✨")
     # Per-provider readiness flags.
+    print(f"  Text LLM Ready (Gemini): {GEMINI_TEXT_IS_READY}") # Using corrected var names
+    print(f"  Text LLM Ready (HF): {HF_TEXT_IS_READY}")
+    print(f"  Image Provider Ready (Stability AI): {STABILITY_API_IS_READY}")
+    print(f"  Image Provider Ready (DALL-E): {OPENAI_DALLE_IS_READY}")
     # Warn when text generation OR image generation has no ready provider; one ready provider
     # per capability is enough to suppress the warning.
+    if not (GEMINI_TEXT_IS_READY or HF_TEXT_IS_READY) or \
+       not (STABILITY_API_IS_READY or OPENAI_DALLE_IS_READY):
+        print("  🔴 WARNING: Not all required AI services are configured. Functionality will be limited or fail.")
+        print("     Please set environment variables/secrets for:")
+        print("     - Text: STORYVERSE_GOOGLE_API_KEY (for Gemini) and/or STORYVERSE_HF_TOKEN (for Hugging Face models)")
+        print("     - Image: STORYVERSE_STABILITY_API_KEY (for Stability AI) and/or STORYVERSE_OPENAI_API_KEY (for DALL-E)")
     # Defaults selected for the UI dropdowns, followed by every available option.
+    print(f"  Default Text Model: {UI_DEFAULT_TEXT_MODEL_KEY}")
+    print(f"  Default Image Provider: {UI_DEFAULT_IMAGE_PROVIDER_KEY}")
     print(f"  Available Text Models: {list(TEXT_MODELS.keys())}")
     print(f"  Available Image Providers: {list(IMAGE_PROVIDERS.keys())}")
     print("="*80)
     # server_name="0.0.0.0" asks Gradio to listen on all network interfaces rather than only
     # localhost; debug=True enables Gradio's debug mode for this launch.
     story_weaver_demo.launch(debug=True, server_name="0.0.0.0")