Spaces:

gnosticdev
/

INVIDEO_BASIC

Runtime error

App Files Files Community

gnosticdev committed 28 days ago

Commit

80b1aba

verified ·

1 Parent(s): 7b02e0f

Update app.py

Browse files

Files changed (1) hide show

app.py +14 -37

app.py CHANGED Viewed

@@ -26,14 +26,13 @@ except ImportError:
     except Exception as e:
         logger.critical(f"Fallo al instalar moviepy: {str(e)}")
         logger.info("Continuando con placeholder para pruebas...")
-        moviepy = None  # Placeholder para evitar errores
 import re
 import math
 import shutil
 import json
 from collections import Counter
-# Configuración de logging
 logging.basicConfig(
     level=logging.DEBUG,
     format='%(asctime)s - %(levelname)s - %(message)s',
@@ -46,7 +45,6 @@ logger.info("="*80)
 logger.info("INICIO DE EJECUCIÓN - GENERADOR DE VIDEOS")
 logger.info("="*80)
-# Diccionario de voces TTS disponibles organizadas por idioma
 VOCES_DISPONIBLES = {
     "Español (España)": {
         "es-ES-JuanNeural": "Juan (España) - Masculino",
@@ -109,7 +107,6 @@ VOCES_DISPONIBLES = {
     }
 }
-# Función para obtener lista plana de voces para el dropdown
 def get_voice_choices():
     choices = []
     for region, voices in VOCES_DISPONIBLES.items():
@@ -117,9 +114,8 @@ def get_voice_choices():
             choices.append((f"{voice_name} ({region})", voice_id))
     return choices
-# Obtener las voces al inicio del script
 AVAILABLE_VOICES = get_voice_choices()
-DEFAULT_VOICE_ID = "es-MX-DaliaNeural"  # Voz más estable
 DEFAULT_VOICE_NAME = DEFAULT_VOICE_ID
 for text, voice_id in AVAILABLE_VOICES:
     if voice_id == DEFAULT_VOICE_ID:
@@ -130,12 +126,10 @@ if DEFAULT_VOICE_ID not in [v[1] for v in AVAILABLE_VOICES]:
     DEFAULT_VOICE_NAME = AVAILABLE_VOICES[0][0] if AVAILABLE_VOICES else "Dalia (México) - Femenino"
 logger.info(f"Voz por defecto seleccionada (ID): {DEFAULT_VOICE_ID}")
-# Clave API de Pexels
 PEXELS_API_KEY = os.environ.get("PEXELS_API_KEY")
 if not PEXELS_API_KEY:
     logger.critical("NO SE ENCONTRÓ PEXELS_API_KEY EN VARIABLES DE ENTORNO")
-# Inicialización de modelos
 MODEL_NAME = "datificate/gpt2-small-spanish"
 logger.info(f"Inicializando modelo GPT-2: {MODEL_NAME}")
 tokenizer = None
@@ -163,7 +157,6 @@ def buscar_videos_pexels(query, api_key, per_page=5):
     if not api_key:
         logger.warning("No se puede buscar en Pexels: API Key no configurada.")
         return []
     logger.debug(f"Buscando en Pexels: '{query}' | Resultados: {per_page}")
     headers = {"Authorization": api_key}
     try:
@@ -199,10 +192,8 @@ def generate_script(prompt, max_length=150):
     if not tokenizer or not model:
         logger.warning("Modelos GPT-2 no disponibles - Usando prompt original como guion.")
         return prompt.strip()
     instruction_phrase_start = "Escribe un guion corto, interesante y coherente sobre:"
     ai_prompt = f"{instruction_phrase_start} {prompt}"
     try:
         inputs = tokenizer(ai_prompt, return_tensors="pt", truncation=True, max_length=512)
         device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
@@ -263,7 +254,6 @@ async def text_to_speech(text, output_path, voice):
         logger.warning(f"edge_tts falló, intentando gTTS...")
     except Exception as e:
         logger.error(f"Error en edge_tts con voz '{voice}': {str(e)}")
     try:
         tts = gTTS(text=text, lang='es')
         tts.save(output_path)
@@ -382,15 +372,14 @@ async def crear_video_async(prompt_type, input_text, selected_voice, musica_file
     video_final = None
     source_clips = []
     clips_to_concatenate = []
     try:
-        # 1. Generar o usar guion
         guion = generate_script(input_text) if prompt_type == "Generar Guion con IA" else input_text.strip()
         logger.info(f"Guion final ({len(guion)} chars): '{guion[:100]}...'")
         if not guion.strip():
             raise ValueError("El guion está vacío.")
-        # 2. Generar audio de voz
         voz_path = os.path.join(temp_dir_intermediate, "voz.mp3")
         tts_voices_to_try = [selected_voice, "es-MX-DaliaNeural"]
         tts_success = False
@@ -444,18 +433,16 @@ async def crear_video_async(prompt_type, input_text, selected_voice, musica_file
             audio_duration = audio_tts_original.duration
         else:
             logger.warning("MoviePy no disponible, asumiendo duración mínima para audio")
-            audio_duration = 1.0  # Valor placeholder
         logger.info(f"Duración audio voz: {audio_duration:.2f} segundos")
         if audio_duration < 1.0:
             raise ValueError("Audio de voz demasiado corto.")
-        # 3. Extraer palabras clave
         keywords = extract_visual_keywords_from_script(guion)
         if not keywords:
             keywords = ["video", "background"]
         logger.info(f"Palabras clave: {keywords}")
-        # 4. Buscar y descargar videos
         videos_data = []
         total_desired_videos = 10
         per_page_per_keyword = max(1, total_desired_videos // len(keywords))
@@ -490,14 +477,13 @@ async def crear_video_async(prompt_type, input_text, selected_voice, musica_file
         if not video_paths:
             raise ValueError("No se descargaron videos utilizables.")
-        # 5. Procesar y concatenar clips de video
         if not moviepy:
             logger.warning("MoviePy no disponible, retornando placeholder...")
             output_filename = f"video_{int(datetime.now().timestamp())}.mp4"
-            persistent_path = os.path.join(temp_dir_intermediate, output_filename)
-            open(persistent_path, 'a').close()  # Crea archivo vacío como placeholder
-            download_url = f"https://gnosticdev-invideo-basic.hf.space/file={persistent_path}"
-            return persistent_path, download_url
         current_duration = 0
         min_clip_duration = 0.5
@@ -526,7 +512,6 @@ async def crear_video_async(prompt_type, input_text, selected_voice, musica_file
         if video_base.duration is None or video_base.duration <= 0:
             raise ValueError("Video base inválido.")
-        # Ajustar duración del video
         if video_base.duration < audio_duration:
             num_full_repeats = int(audio_duration // video_base.duration)
             remaining_duration = audio_duration % video_base.duration
@@ -538,7 +523,6 @@ async def crear_video_async(prompt_type, input_text, selected_voice, musica_file
         elif video_base.duration > audio_duration:
             video_base = video_base.subclip(0, audio_duration)
-        # 6. Manejar música de fondo
         final_audio = audio_tts
         if musica_file:
             try:
@@ -559,7 +543,6 @@ async def crear_video_async(prompt_type, input_text, selected_voice, musica_file
         if abs(final_audio.duration - video_base.duration) > 0.2:
             final_audio = final_audio.subclip(0, video_base.duration)
-        # 7. Combinar audio y video
         video_final = video_base.set_audio(final_audio)
         output_filename = f"video_{int(datetime.now().timestamp())}.mp4"
         output_path = os.path.join(temp_dir_intermediate, output_filename)
@@ -620,11 +603,16 @@ async def crear_video_async(prompt_type, input_text, selected_voice, musica_file
             except:
                 pass
         for path in temp_intermediate_files:
-            if os.path.isfile(path) and path != output_path:
                 try:
                     os.remove(path)
                 except:
                     logger.warning(f"No se pudo eliminar {path}")
 async def run_app_async(prompt_type, prompt_ia, prompt_manual, musica_file, selected_voice):
     logger.info("="*80)
@@ -644,10 +632,7 @@ async def run_app_async(prompt_type, prompt_ia, prompt_manual, musica_file, sele
         selected_voice = DEFAULT_VOICE_ID
     try:
-        # Crear tarea para generar video
         task = asyncio.create_task(crear_video_async(prompt_type, input_text, selected_voice, musica_file))
-        # Verificar progreso cada 5 segundos durante 10 minutos (600s)
         timeout = 600
         interval = 5
         elapsed = 0
@@ -668,8 +653,6 @@ async def run_app_async(prompt_type, prompt_ia, prompt_manual, musica_file, sele
             elapsed += interval
             status_msg = gr.update(value=f"⏳ Procesando... Tiempo transcurrido: {elapsed}s")
             logger.debug(f"Esperando video, tiempo transcurrido: {elapsed}s")
-        # Si se excede el timeout
         logger.error("Tiempo de espera excedido para la generación del video.")
         status_msg = gr.update(value="❌ Error: Tiempo de espera excedido (10 minutos).")
         task.cancel()
@@ -678,7 +661,6 @@ async def run_app_async(prompt_type, prompt_ia, prompt_manual, musica_file, sele
         except asyncio.CancelledError:
             pass
         return None, None, status_msg
     except ValueError as ve:
         logger.warning(f"Error de validación: {str(ve)}")
         status_msg = gr.update(value=f"⚠️ Error: {str(ve)}")
@@ -691,11 +673,9 @@ async def run_app_async(prompt_type, prompt_ia, prompt_manual, musica_file, sele
 def run_app(prompt_type, prompt_ia, prompt_manual, musica_file, selected_voice):
     return asyncio.run(run_app_async(prompt_type, prompt_ia, prompt_manual, musica_file, selected_voice))
-# Interfaz de Gradio
 with gr.Blocks(title="Generador de Videos con IA", theme=gr.themes.Soft()) as app:
     gr.Markdown("# 🎬 Generador Automático de Videos con IA")
     gr.Markdown("Genera videos cortos a partir de un tema o guion, usando imágenes de archivo de Pexels y voz generada.")
     with gr.Row():
         with gr.Column():
             prompt_type = gr.Radio(
@@ -746,13 +726,11 @@ with gr.Blocks(title="Generador de Videos con IA", theme=gr.themes.Soft()) as ap
                 placeholder="Esperando acción...",
                 value="Esperando entrada..."
             )
     prompt_type.change(
         fn=lambda x: (gr.update(visible=x == "Generar Guion con IA"), gr.update(visible=x == "Usar Mi Guion")),
         inputs=prompt_type,
         outputs=[ia_guion_column, manual_guion_column]
     )
     generate_btn.click(
         fn=lambda: (None, None, gr.update(value="⏳ Iniciando generación de video...")),
         outputs=[video_output, file_output, status_output]
@@ -766,7 +744,6 @@ with gr.Blocks(title="Generador de Videos con IA", theme=gr.themes.Soft()) as ap
         inputs=[video_output, file_output, status_output],
         outputs=[file_output]
     )
     gr.Markdown("### Instrucciones:")
     gr.Markdown("""
     1. Configura la variable de entorno `PEXELS_API_KEY`.

     except Exception as e:
         logger.critical(f"Fallo al instalar moviepy: {str(e)}")
         logger.info("Continuando con placeholder para pruebas...")
+        moviepy = None
 import re
 import math
 import shutil
 import json
 from collections import Counter
 logging.basicConfig(
     level=logging.DEBUG,
     format='%(asctime)s - %(levelname)s - %(message)s',
 logger.info("INICIO DE EJECUCIÓN - GENERADOR DE VIDEOS")
 logger.info("="*80)
 VOCES_DISPONIBLES = {
     "Español (España)": {
         "es-ES-JuanNeural": "Juan (España) - Masculino",
     }
 }
 def get_voice_choices():
     choices = []
     for region, voices in VOCES_DISPONIBLES.items():
             choices.append((f"{voice_name} ({region})", voice_id))
     return choices
 AVAILABLE_VOICES = get_voice_choices()
+DEFAULT_VOICE_ID = "es-MX-DaliaNeural"
 DEFAULT_VOICE_NAME = DEFAULT_VOICE_ID
 for text, voice_id in AVAILABLE_VOICES:
     if voice_id == DEFAULT_VOICE_ID:
     DEFAULT_VOICE_NAME = AVAILABLE_VOICES[0][0] if AVAILABLE_VOICES else "Dalia (México) - Femenino"
 logger.info(f"Voz por defecto seleccionada (ID): {DEFAULT_VOICE_ID}")
 PEXELS_API_KEY = os.environ.get("PEXELS_API_KEY")
 if not PEXELS_API_KEY:
     logger.critical("NO SE ENCONTRÓ PEXELS_API_KEY EN VARIABLES DE ENTORNO")
 MODEL_NAME = "datificate/gpt2-small-spanish"
 logger.info(f"Inicializando modelo GPT-2: {MODEL_NAME}")
 tokenizer = None
     if not api_key:
         logger.warning("No se puede buscar en Pexels: API Key no configurada.")
         return []
     logger.debug(f"Buscando en Pexels: '{query}' | Resultados: {per_page}")
     headers = {"Authorization": api_key}
     try:
     if not tokenizer or not model:
         logger.warning("Modelos GPT-2 no disponibles - Usando prompt original como guion.")
         return prompt.strip()
     instruction_phrase_start = "Escribe un guion corto, interesante y coherente sobre:"
     ai_prompt = f"{instruction_phrase_start} {prompt}"
     try:
         inputs = tokenizer(ai_prompt, return_tensors="pt", truncation=True, max_length=512)
         device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
         logger.warning(f"edge_tts falló, intentando gTTS...")
     except Exception as e:
         logger.error(f"Error en edge_tts con voz '{voice}': {str(e)}")
     try:
         tts = gTTS(text=text, lang='es')
         tts.save(output_path)
     video_final = None
     source_clips = []
     clips_to_concatenate = []
+    output_path = None
     try:
         guion = generate_script(input_text) if prompt_type == "Generar Guion con IA" else input_text.strip()
         logger.info(f"Guion final ({len(guion)} chars): '{guion[:100]}...'")
         if not guion.strip():
             raise ValueError("El guion está vacío.")
         voz_path = os.path.join(temp_dir_intermediate, "voz.mp3")
         tts_voices_to_try = [selected_voice, "es-MX-DaliaNeural"]
         tts_success = False
             audio_duration = audio_tts_original.duration
         else:
             logger.warning("MoviePy no disponible, asumiendo duración mínima para audio")
+            audio_duration = 1.0
         logger.info(f"Duración audio voz: {audio_duration:.2f} segundos")
         if audio_duration < 1.0:
             raise ValueError("Audio de voz demasiado corto.")
         keywords = extract_visual_keywords_from_script(guion)
         if not keywords:
             keywords = ["video", "background"]
         logger.info(f"Palabras clave: {keywords}")
         videos_data = []
         total_desired_videos = 10
         per_page_per_keyword = max(1, total_desired_videos // len(keywords))
         if not video_paths:
             raise ValueError("No se descargaron videos utilizables.")
         if not moviepy:
             logger.warning("MoviePy no disponible, retornando placeholder...")
             output_filename = f"video_{int(datetime.now().timestamp())}.mp4"
+            output_path = os.path.join(temp_dir_intermediate, output_filename)
+            open(output_path, 'a').close()
+            download_url = f"https://gnosticdev-invideo-basic.hf.space/file={output_path}"
+            return output_path, download_url
         current_duration = 0
         min_clip_duration = 0.5
         if video_base.duration is None or video_base.duration <= 0:
             raise ValueError("Video base inválido.")
         if video_base.duration < audio_duration:
             num_full_repeats = int(audio_duration // video_base.duration)
             remaining_duration = audio_duration % video_base.duration
         elif video_base.duration > audio_duration:
             video_base = video_base.subclip(0, audio_duration)
         final_audio = audio_tts
         if musica_file:
             try:
         if abs(final_audio.duration - video_base.duration) > 0.2:
             final_audio = final_audio.subclip(0, video_base.duration)
         video_final = video_base.set_audio(final_audio)
         output_filename = f"video_{int(datetime.now().timestamp())}.mp4"
         output_path = os.path.join(temp_dir_intermediate, output_filename)
             except:
                 pass
         for path in temp_intermediate_files:
+            if os.path.isfile(path) and (output_path is None or path != output_path):
                 try:
                     os.remove(path)
                 except:
                     logger.warning(f"No se pudo eliminar {path}")
+        try:
+            if os.path.exists(temp_dir_intermediate) and (output_path is None or not output_path.startswith(temp_dir_intermediate)):
+                shutil.rmtree(temp_dir_intermediate)
+        except:
+            logger.warning(f"No se pudo eliminar directorio temporal {temp_dir_intermediate}")
 async def run_app_async(prompt_type, prompt_ia, prompt_manual, musica_file, selected_voice):
     logger.info("="*80)
         selected_voice = DEFAULT_VOICE_ID
     try:
         task = asyncio.create_task(crear_video_async(prompt_type, input_text, selected_voice, musica_file))
         timeout = 600
         interval = 5
         elapsed = 0
             elapsed += interval
             status_msg = gr.update(value=f"⏳ Procesando... Tiempo transcurrido: {elapsed}s")
             logger.debug(f"Esperando video, tiempo transcurrido: {elapsed}s")
         logger.error("Tiempo de espera excedido para la generación del video.")
         status_msg = gr.update(value="❌ Error: Tiempo de espera excedido (10 minutos).")
         task.cancel()
         except asyncio.CancelledError:
             pass
         return None, None, status_msg
     except ValueError as ve:
         logger.warning(f"Error de validación: {str(ve)}")
         status_msg = gr.update(value=f"⚠️ Error: {str(ve)}")
 def run_app(prompt_type, prompt_ia, prompt_manual, musica_file, selected_voice):
     return asyncio.run(run_app_async(prompt_type, prompt_ia, prompt_manual, musica_file, selected_voice))
 with gr.Blocks(title="Generador de Videos con IA", theme=gr.themes.Soft()) as app:
     gr.Markdown("# 🎬 Generador Automático de Videos con IA")
     gr.Markdown("Genera videos cortos a partir de un tema o guion, usando imágenes de archivo de Pexels y voz generada.")
     with gr.Row():
         with gr.Column():
             prompt_type = gr.Radio(
                 placeholder="Esperando acción...",
                 value="Esperando entrada..."
             )
     prompt_type.change(
         fn=lambda x: (gr.update(visible=x == "Generar Guion con IA"), gr.update(visible=x == "Usar Mi Guion")),
         inputs=prompt_type,
         outputs=[ia_guion_column, manual_guion_column]
     )
     generate_btn.click(
         fn=lambda: (None, None, gr.update(value="⏳ Iniciando generación de video...")),
         outputs=[video_output, file_output, status_output]
         inputs=[video_output, file_output, status_output],
         outputs=[file_output]
     )
     gr.Markdown("### Instrucciones:")
     gr.Markdown("""
     1. Configura la variable de entorno `PEXELS_API_KEY`.