Spaces:

mgbam
/

ChronoWeave

Sleeping

App Files Files Community

mgbam committed on Apr 15

Commit

2344b77

verified ·

1 Parent(s): 219ad6e

Update app.py

Browse files

Files changed (1) hide show

app.py +13 -16

app.py CHANGED Viewed

@@ -17,7 +17,7 @@ import contextlib
 import asyncio
 import uuid  # For unique identifiers
 import shutil  # For directory operations
-import logging  # For logging
 # Image handling
 from PIL import Image
@@ -36,7 +36,7 @@ import typing_extensions as typing
 import nest_asyncio
 nest_asyncio.apply()
-# Import Vertex AI SDK and service account credentials support
 import vertexai
 from vertexai.preview.vision_models import ImageGenerationModel
 from google.oauth2 import service_account
@@ -84,14 +84,13 @@ except KeyError:
         st.error("🚨 **Google API Key Not Found!** Please configure it.", icon="🚨")
         st.stop()
-# Vertex AI configuration: PROJECT_ID and LOCATION
 PROJECT_ID = st.secrets.get("PROJECT_ID") or os.environ.get("PROJECT_ID")
 LOCATION = st.secrets.get("LOCATION") or os.environ.get("LOCATION", "us-central1")
 if not PROJECT_ID:
     st.error("🚨 **PROJECT_ID not set!** Please add PROJECT_ID to your secrets.", icon="🚨")
     st.stop()
-# Load service account JSON from the secret
 try:
     service_account_info = json.loads(os.environ["SERVICE_ACCOUNT_JSON"])
     credentials = service_account.Credentials.from_service_account_info(service_account_info)
@@ -175,7 +174,6 @@ def wave_file_writer(filename: str, channels: int = 1, rate: int = AUDIO_SAMPLIN
                 logger.error(f"Error closing wave file {filename}: {e_close}")
 # --- Audio Generation using gTTS ---
-# We replace the previous failing method with gTTS.
 async def generate_audio_live_async(api_text: str, output_filename: str, voice: Optional[str] = None) -> Optional[str]:
     """
     Generates audio using gTTS (Google Text-to-Speech).
@@ -184,16 +182,18 @@ async def generate_audio_live_async(api_text: str, output_filename: str, voice:
     task_id = os.path.basename(output_filename).split('.')[0]
     logger.info(f"🎙️ [{task_id}] Generating audio via gTTS for text: '{api_text[:60]}...'")
     try:
-        # Generate audio using gTTS
         tts = gTTS(text=api_text, lang="en")
-        # Replace .wav with .mp3
         mp3_filename = output_filename.replace(".wav", ".mp3")
         tts.save(mp3_filename)
         logger.info(f"✅ [{task_id}] Audio saved: {os.path.basename(mp3_filename)}")
         return mp3_filename
     except Exception as e:
         logger.exception(f"❌ [{task_id}] Audio generation error: {e}")
-        st.error(f"Audio generation failed for {task_id}: {e}", icon="🔊")
         return None
 def generate_story_sequence_chrono(theme: str, num_scenes: int, num_timelines: int, divergence_prompt: str = "") -> Optional[ChronoWeaveResponse]:
@@ -258,8 +258,8 @@ def generate_image_imagen(prompt: str, aspect_ratio: str = "1:1", task_id: str =
     """
     Generates an image using Vertex AI's Imagen model via the Vertex AI preview API.
-    This function loads the pretrained Imagen model "imagen-3.0-generate-002" and generates an image.
-    If authentication fails, it provides guidance on how to resolve the issue.
     """
     logger.info(f"🖼️ [{task_id}] Requesting image: '{prompt[:70]}...' (Aspect: {aspect_ratio})")
     try:
@@ -278,12 +278,10 @@ def generate_image_imagen(prompt: str, aspect_ratio: str = "1:1", task_id: str =
         return image
     except Exception as e:
         error_str = str(e)
-        if "Unable to authenticate" in error_str:
             error_msg = (
-                "Authentication error: Unable to authenticate your request. "
-                "Ensure your service account JSON is loaded correctly. "
-                "For example, on Hugging Face Spaces, set SERVICE_ACCOUNT_JSON in your repository secrets. "
-                "If running locally, run `!gcloud auth login`."
             )
         else:
             error_msg = f"Image generation for {task_id} failed: {e}"
@@ -382,7 +380,6 @@ if generate_button:
                         generated_audio_path: Optional[str] = None
                         if not scene_has_error:
                             with st.spinner(f"[{task_id}] Generating audio... 🔊"):
-                                # Change output extension to .wav for consistency, but gTTS returns MP3
                                 audio_path_temp = os.path.join(temp_dir, f"{task_id}_audio.wav")
                                 try:
                                     generated_audio_path = asyncio.run(generate_audio_live_async(segment.audio_text, audio_path_temp, audio_voice))

 import asyncio
 import uuid  # For unique identifiers
 import shutil  # For directory operations
+import logging
 # Image handling
 from PIL import Image
 import nest_asyncio
 nest_asyncio.apply()
+# Import Vertex AI SDK and Google service account credentials support
 import vertexai
 from vertexai.preview.vision_models import ImageGenerationModel
 from google.oauth2 import service_account
         st.error("🚨 **Google API Key Not Found!** Please configure it.", icon="🚨")
         st.stop()
 PROJECT_ID = st.secrets.get("PROJECT_ID") or os.environ.get("PROJECT_ID")
 LOCATION = st.secrets.get("LOCATION") or os.environ.get("LOCATION", "us-central1")
 if not PROJECT_ID:
     st.error("🚨 **PROJECT_ID not set!** Please add PROJECT_ID to your secrets.", icon="🚨")
     st.stop()
+# Load service account JSON from secret and create credentials
 try:
     service_account_info = json.loads(os.environ["SERVICE_ACCOUNT_JSON"])
     credentials = service_account.Credentials.from_service_account_info(service_account_info)
                 logger.error(f"Error closing wave file {filename}: {e_close}")
 # --- Audio Generation using gTTS ---
 async def generate_audio_live_async(api_text: str, output_filename: str, voice: Optional[str] = None) -> Optional[str]:
     """
     Generates audio using gTTS (Google Text-to-Speech).
     task_id = os.path.basename(output_filename).split('.')[0]
     logger.info(f"🎙️ [{task_id}] Generating audio via gTTS for text: '{api_text[:60]}...'")
     try:
         tts = gTTS(text=api_text, lang="en")
         mp3_filename = output_filename.replace(".wav", ".mp3")
         tts.save(mp3_filename)
         logger.info(f"✅ [{task_id}] Audio saved: {os.path.basename(mp3_filename)}")
         return mp3_filename
     except Exception as e:
+        error_str = str(e)
+        if "429" in error_str:
+            st.error(f"Audio generation for {task_id} failed: 429 Too Many Requests from TTS API. Please try again later.", icon="🔊")
+        else:
+            st.error(f"Audio generation for {task_id} failed: {e}", icon="🔊")
         logger.exception(f"❌ [{task_id}] Audio generation error: {e}")
         return None
 def generate_story_sequence_chrono(theme: str, num_scenes: int, num_timelines: int, divergence_prompt: str = "") -> Optional[ChronoWeaveResponse]:
     """
     Generates an image using Vertex AI's Imagen model via the Vertex AI preview API.
+    Loads the pretrained Imagen model and attempts to generate an image.
+    If a quota exceeded error occurs, it informs you to request a quota increase.
     """
     logger.info(f"🖼️ [{task_id}] Requesting image: '{prompt[:70]}...' (Aspect: {aspect_ratio})")
     try:
         return image
     except Exception as e:
         error_str = str(e)
+        if "Quota exceeded" in error_str:
             error_msg = (
+                "Quota exceeded for image generation requests. "
+                "Please submit a quota increase request via the Vertex AI console: https://cloud.google.com/vertex-ai/docs/generative-ai/quotas-genai"
             )
         else:
             error_msg = f"Image generation for {task_id} failed: {e}"
                         generated_audio_path: Optional[str] = None
                         if not scene_has_error:
                             with st.spinner(f"[{task_id}] Generating audio... 🔊"):
                                 audio_path_temp = os.path.join(temp_dir, f"{task_id}_audio.wav")
                                 try:
                                     generated_audio_path = asyncio.run(generate_audio_live_async(segment.audio_text, audio_path_temp, audio_voice))