mgbam committed on
Commit
8b30fd7
·
verified ·
1 Parent(s): 2bfad86

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +20 -43
app.py CHANGED
@@ -1,27 +1,29 @@
1
  import gradio as gr
2
  import os
3
  import google.generativeai as genai
4
- import elevenlabs
 
5
  from tavily import TavilyClient
6
- import requests # For Runway API calls
7
  import subprocess
8
  import json
9
  import time
10
  import random
11
 
12
  # --- 1. CONFIGURE API KEYS FROM HUGGING FACE SECRETS ---
13
- # Ensure you have set these in your Space's settings -> secrets
14
  try:
15
  genai.configure(api_key=os.environ["GEMINI_API_KEY"])
16
- elevenlabs.set_api_key(os.environ["ELEVENLABS_API_KEY"])
17
  tavily_client = TavilyClient(api_key=os.environ["TAVILY_API_KEY"])
18
  RUNWAY_API_KEY = os.environ["RUNWAY_API_KEY"]
 
 
 
 
19
  except KeyError as e:
20
  raise ValueError(f"API Key Error: Please set the {e} secret in your Hugging Face Space settings.")
21
 
22
  # --- 2. DEFINE API ENDPOINTS AND HEADERS ---
23
- # NOTE: Check the latest RunwayML API documentation for the correct endpoint. This is a common one.
24
- RUNWAY_API_URL = "https://api.runwayml.com/v1/jobs"
25
  RUNWAY_HEADERS = {
26
  "Authorization": f"Bearer {RUNWAY_API_KEY}",
27
  "Content-Type": "application/json"
@@ -29,12 +31,6 @@ RUNWAY_HEADERS = {
29
 
30
  # --- 3. THE CORE VIDEO GENERATION FUNCTION ---
31
  def generate_video_from_topic(topic_prompt, progress=gr.Progress(track_tqdm=True)):
32
- """
33
- Main function to orchestrate the video generation pipeline.
34
- It takes a topic and returns the path to the final generated video.
35
- """
36
-
37
- # Use a unique ID for this job to prevent file collisions
38
  job_id = f"{int(time.time())}_{random.randint(1000, 9999)}"
39
  print(f"--- Starting New Job: {job_id} for topic: '{topic_prompt}' ---")
40
 
@@ -64,22 +60,10 @@ def generate_video_from_topic(topic_prompt, progress=gr.Progress(track_tqdm=True
64
  Your output MUST be a valid JSON object with two keys:
65
  1. "narration_script": A string containing the full voiceover narration. Make it engaging and concise.
66
  2. "scene_prompts": A list of exactly 4 strings. Each string must be a highly detailed, visually rich, and cinematic prompt for a text-to-video AI like Runway Gen-2. Describe camera angles, lighting, and mood.
67
-
68
- Example JSON format:
69
- {{
70
- "narration_script": "Did you know the ocean's depths hold more history than all the world's museums combined? Let's dive in...",
71
- "scene_prompts": [
72
- "An ultra-realistic, cinematic shot of a massive blue whale gliding through deep, sun-dappled ocean water, camera tracking smoothly alongside it.",
73
- "A dramatic, slow-motion close-up of an ancient shipwreck on the seabed, covered in coral, with schools of small fish swimming through its broken hull.",
74
- "A bioluminescent jellyfish pulsing with ethereal light in the pitch-black abyss, shot with a macro lens.",
75
- "A wide, epic shot of a volcanic vent on the ocean floor erupting with dark smoke, viewed from a safe distance, creating a sense of immense power."
76
- ]
77
- }}
78
  """
79
  response = gemini_model.generate_content(prompt)
80
 
81
  try:
82
- # Clean the response text before parsing
83
  cleaned_text = response.text.strip().replace("```json", "").replace("```", "")
84
  script_data = json.loads(cleaned_text)
85
  narration = script_data['narration_script']
@@ -92,30 +76,32 @@ def generate_video_from_topic(topic_prompt, progress=gr.Progress(track_tqdm=True
92
  progress(0.3, desc="🎙️ Recording voiceover with ElevenLabs...")
93
  audio_path = f"audio_{job_id}.mp3"
94
  intermediate_files.append(audio_path)
95
- audio_bytes = elevenlabs.generate(text=narration, voice="Adam", model="eleven_multilingual_v2")
 
 
 
 
 
 
96
  with open(audio_path, "wb") as f:
97
  f.write(audio_bytes)
98
  print(f"Audio file saved: {audio_path}")
99
 
100
- # STEP 4: VISUALS (Runway) - This is the most complex step
101
  video_clip_paths = []
102
  for i, scene_prompt in enumerate(scene_prompts):
103
  progress(0.4 + (i * 0.12), desc=f"🎬 Generating video scene {i+1}/{len(scene_prompts)}...")
104
-
105
- # A. Start the generation job
106
  runway_payload = {"text_prompt": scene_prompt}
107
  post_response = requests.post(RUNWAY_API_URL, headers=RUNWAY_HEADERS, json=runway_payload)
108
  if post_response.status_code != 200:
109
  raise gr.Error(f"Runway API Error (start job): {post_response.status_code} - {post_response.text}")
110
 
111
- job_details = post_response.json()
112
- task_id = job_details.get("uuid")
113
  if not task_id:
114
- raise gr.Error(f"Runway API did not return a task UUID. Response: {job_details}")
115
 
116
- # B. Poll for job completion
117
  video_url = None
118
- for _ in range(60): # Poll for up to 10 minutes (60 * 10s)
119
  get_response = requests.get(f"{RUNWAY_API_URL}/{task_id}", headers=RUNWAY_HEADERS)
120
  status_details = get_response.json()
121
  status = status_details.get("status")
@@ -130,9 +116,8 @@ def generate_video_from_topic(topic_prompt, progress=gr.Progress(track_tqdm=True
130
  time.sleep(10)
131
 
132
  if not video_url:
133
- raise gr.Error(f"Runway job timed out after 10 minutes for scene {i+1}.")
134
 
135
- # C. Download the generated video
136
  clip_path = f"scene_{i+1}_{job_id}.mp4"
137
  intermediate_files.append(clip_path)
138
  video_clip_paths.append(clip_path)
@@ -145,22 +130,17 @@ def generate_video_from_topic(topic_prompt, progress=gr.Progress(track_tqdm=True
145
 
146
  # STEP 5: STITCHING (FFmpeg)
147
  progress(0.9, desc="✂️ Assembling final video with FFmpeg...")
148
-
149
- # Create a file list for ffmpeg
150
  file_list_path = f"file_list_{job_id}.txt"
151
  intermediate_files.append(file_list_path)
152
  with open(file_list_path, "w") as f:
153
  for clip in video_clip_paths:
154
  f.write(f"file '{clip}'\n")
155
 
156
- # Concatenate video clips
157
  combined_video_path = f"combined_video_{job_id}.mp4"
158
  intermediate_files.append(combined_video_path)
159
  subprocess.run(['ffmpeg', '-f', 'concat', '-safe', '0', '-i', file_list_path, '-c', 'copy', combined_video_path, '-y'], check=True)
160
 
161
- # Add audio to the combined video
162
  final_video_path = f"final_video_{job_id}.mp4"
163
- # We don't add this to intermediate files because we want to keep it
164
  subprocess.run([
165
  'ffmpeg', '-i', combined_video_path, '-i', audio_path, '-c:v', 'copy',
166
  '-c:a', 'aac', '-shortest', final_video_path, '-y'
@@ -171,20 +151,17 @@ def generate_video_from_topic(topic_prompt, progress=gr.Progress(track_tqdm=True
171
  return final_video_path
172
 
173
  except Exception as e:
174
- # If anything goes wrong, raise a Gradio error to display it in the UI
175
  print(f"--- JOB {job_id} FAILED --- \nError: {e}")
176
  raise gr.Error(f"An error occurred: {e}")
177
 
178
  finally:
179
  # STEP 6: CLEANUP
180
- # Clean up all the temporary files we created
181
  print("Cleaning up intermediate files...")
182
  for file_path in intermediate_files:
183
  if os.path.exists(file_path):
184
  os.remove(file_path)
185
  print(f"Removed: {file_path}")
186
 
187
-
188
  # --- 4. CREATE AND LAUNCH THE GRADIO INTERFACE ---
189
  with gr.Blocks(theme=gr.themes.Soft()) as demo:
190
  gr.Markdown(
 
1
  import gradio as gr
2
  import os
3
  import google.generativeai as genai
4
+ # --- CHANGE 1: Import the new ElevenLabs client ---
5
+ from elevenlabs.client import ElevenLabs
6
  from tavily import TavilyClient
7
+ import requests
8
  import subprocess
9
  import json
10
  import time
11
  import random
12
 
13
  # --- 1. CONFIGURE API KEYS FROM HUGGING FACE SECRETS ---
 
14
  try:
15
  genai.configure(api_key=os.environ["GEMINI_API_KEY"])
 
16
  tavily_client = TavilyClient(api_key=os.environ["TAVILY_API_KEY"])
17
  RUNWAY_API_KEY = os.environ["RUNWAY_API_KEY"]
18
+
19
+ # --- CHANGE 2: Create an instance of the ElevenLabs client ---
20
+ elevenlabs_client = ElevenLabs(api_key=os.environ["ELEVENLABS_API_KEY"])
21
+
22
  except KeyError as e:
23
  raise ValueError(f"API Key Error: Please set the {e} secret in your Hugging Face Space settings.")
24
 
25
  # --- 2. DEFINE API ENDPOINTS AND HEADERS ---
26
+ RUNWAY_API_URL = "https://api.runwayml.com/v1/jobs"
 
27
  RUNWAY_HEADERS = {
28
  "Authorization": f"Bearer {RUNWAY_API_KEY}",
29
  "Content-Type": "application/json"
 
31
 
32
  # --- 3. THE CORE VIDEO GENERATION FUNCTION ---
33
  def generate_video_from_topic(topic_prompt, progress=gr.Progress(track_tqdm=True)):
 
 
 
 
 
 
34
  job_id = f"{int(time.time())}_{random.randint(1000, 9999)}"
35
  print(f"--- Starting New Job: {job_id} for topic: '{topic_prompt}' ---")
36
 
 
60
  Your output MUST be a valid JSON object with two keys:
61
  1. "narration_script": A string containing the full voiceover narration. Make it engaging and concise.
62
  2. "scene_prompts": A list of exactly 4 strings. Each string must be a highly detailed, visually rich, and cinematic prompt for a text-to-video AI like Runway Gen-2. Describe camera angles, lighting, and mood.
 
 
 
 
 
 
 
 
 
 
 
63
  """
64
  response = gemini_model.generate_content(prompt)
65
 
66
  try:
 
67
  cleaned_text = response.text.strip().replace("```json", "").replace("```", "")
68
  script_data = json.loads(cleaned_text)
69
  narration = script_data['narration_script']
 
76
  progress(0.3, desc="🎙️ Recording voiceover with ElevenLabs...")
77
  audio_path = f"audio_{job_id}.mp3"
78
  intermediate_files.append(audio_path)
79
+
80
+ # --- CHANGE 3: Use the client instance to generate audio ---
81
+ audio_bytes = elevenlabs_client.generate(
82
+ text=narration,
83
+ voice="Adam",
84
+ model="eleven_multilingual_v2"
85
+ )
86
  with open(audio_path, "wb") as f:
87
  f.write(audio_bytes)
88
  print(f"Audio file saved: {audio_path}")
89
 
90
+ # STEP 4: VISUALS (Runway)
91
  video_clip_paths = []
92
  for i, scene_prompt in enumerate(scene_prompts):
93
  progress(0.4 + (i * 0.12), desc=f"🎬 Generating video scene {i+1}/{len(scene_prompts)}...")
 
 
94
  runway_payload = {"text_prompt": scene_prompt}
95
  post_response = requests.post(RUNWAY_API_URL, headers=RUNWAY_HEADERS, json=runway_payload)
96
  if post_response.status_code != 200:
97
  raise gr.Error(f"Runway API Error (start job): {post_response.status_code} - {post_response.text}")
98
 
99
+ task_id = post_response.json().get("uuid")
 
100
  if not task_id:
101
+ raise gr.Error(f"Runway API did not return a task UUID. Response: {post_response.json()}")
102
 
 
103
  video_url = None
104
+ for _ in range(60):
105
  get_response = requests.get(f"{RUNWAY_API_URL}/{task_id}", headers=RUNWAY_HEADERS)
106
  status_details = get_response.json()
107
  status = status_details.get("status")
 
116
  time.sleep(10)
117
 
118
  if not video_url:
119
+ raise gr.Error(f"Runway job timed out for scene {i+1}.")
120
 
 
121
  clip_path = f"scene_{i+1}_{job_id}.mp4"
122
  intermediate_files.append(clip_path)
123
  video_clip_paths.append(clip_path)
 
130
 
131
  # STEP 5: STITCHING (FFmpeg)
132
  progress(0.9, desc="✂️ Assembling final video with FFmpeg...")
 
 
133
  file_list_path = f"file_list_{job_id}.txt"
134
  intermediate_files.append(file_list_path)
135
  with open(file_list_path, "w") as f:
136
  for clip in video_clip_paths:
137
  f.write(f"file '{clip}'\n")
138
 
 
139
  combined_video_path = f"combined_video_{job_id}.mp4"
140
  intermediate_files.append(combined_video_path)
141
  subprocess.run(['ffmpeg', '-f', 'concat', '-safe', '0', '-i', file_list_path, '-c', 'copy', combined_video_path, '-y'], check=True)
142
 
 
143
  final_video_path = f"final_video_{job_id}.mp4"
 
144
  subprocess.run([
145
  'ffmpeg', '-i', combined_video_path, '-i', audio_path, '-c:v', 'copy',
146
  '-c:a', 'aac', '-shortest', final_video_path, '-y'
 
151
  return final_video_path
152
 
153
  except Exception as e:
 
154
  print(f"--- JOB {job_id} FAILED --- \nError: {e}")
155
  raise gr.Error(f"An error occurred: {e}")
156
 
157
  finally:
158
  # STEP 6: CLEANUP
 
159
  print("Cleaning up intermediate files...")
160
  for file_path in intermediate_files:
161
  if os.path.exists(file_path):
162
  os.remove(file_path)
163
  print(f"Removed: {file_path}")
164
 
 
165
  # --- 4. CREATE AND LAUNCH THE GRADIO INTERFACE ---
166
  with gr.Blocks(theme=gr.themes.Soft()) as demo:
167
  gr.Markdown(