TTS_API_Image_fallback

Sleeping

App Files Community

khurrameycon committed on Apr 6

Commit

44d8d66

verified ·

1 Parent(s): 1570ec4

Update app.py

Browse files

Files changed (1) hide show

app.py +12 -16

app.py CHANGED Viewed

@@ -105,10 +105,8 @@ from huggingface_hub import InferenceClient
 from pydantic import BaseModel
 import base64
 import logging
-from typing import Optional
-import uuid
 from typing import Optional, ClassVar, List
 # Set up logging
 logging.basicConfig(level=logging.INFO)
@@ -117,10 +115,10 @@ logger = logging.getLogger(__name__)
 class TextImageRequest(BaseModel):
     text: Optional[str] = None
     image_base64: Optional[str] = None
-    voice: str = "af_heart"  # Default voice
     speed: float = 1.0
-    # Annotate as ClassVar to indicate this is not a model field.
     AVAILABLE_VOICES: ClassVar[List[str]] = ["af_heart"]
     def validate_voice(self):
@@ -160,7 +158,7 @@ def llm_chat_response(text, image_base64=None):
         logger.info("Initializing InferenceClient...")
         client = InferenceClient(
-            provider="hf-inference",  # Using correct provider as per sample
             api_key=HF_TOKEN
         )
@@ -180,20 +178,17 @@ def llm_chat_response(text, image_base64=None):
             base_url = os.getenv("BASE_URL", "http://localhost:8000")
             image_url = f"{base_url}/static/{filename}"
             prompt = text if text else "Describe this image in one sentence."
             messages = [
                 {
                     "role": "user",
                     "content": [
-                        {
-                            "type": "text",
-                            "text": prompt
-                        },
-                        {
-                            "type": "image_url",
-                            "image_url": {
-                                "url": image_url
-                            }
-                        }
                     ]
                 }
             ]
@@ -344,3 +339,4 @@ async def method_not_allowed_handler(request: Request, exc):
         status_code=405,
         content={"error": "Method not allowed. Please check the API documentation."}
     )

 from pydantic import BaseModel
 import base64
 import logging
 from typing import Optional, ClassVar, List
+import uuid
 # Set up logging
 logging.basicConfig(level=logging.INFO)
 class TextImageRequest(BaseModel):
     text: Optional[str] = None
     image_base64: Optional[str] = None
+    voice: str = "af_heart"  # Default voice that we know exists
     speed: float = 1.0
+    # Annotated as a ClassVar so Pydantic doesn't treat it as a model field.
     AVAILABLE_VOICES: ClassVar[List[str]] = ["af_heart"]
     def validate_voice(self):
         logger.info("Initializing InferenceClient...")
         client = InferenceClient(
+            provider="hf-inference",  # Using the correct provider
             api_key=HF_TOKEN
         )
             base_url = os.getenv("BASE_URL", "http://localhost:8000")
             image_url = f"{base_url}/static/{filename}"
             prompt = text if text else "Describe this image in one sentence."
+            # Include a system message to provide conversation context
             messages = [
+                {
+                    "role": "system",
+                    "content": "You are a helpful assistant that describes images and answers questions about them."
+                },
                 {
                     "role": "user",
                     "content": [
+                        {"type": "text", "text": prompt},
+                        {"type": "image_url", "image_url": {"url": image_url}}
                     ]
                 }
             ]
         status_code=405,
         content={"error": "Method not allowed. Please check the API documentation."}
     )