Spaces:
Running
Running
import logging | |
from typing import Optional, List | |
# Configure logging | |
logger = logging.getLogger(__name__) | |
# Import the base class | |
from utils.tts_base import TTSEngineBase, DummyTTSEngine | |
class TTSFactory: | |
"""Factory class for creating TTS engines | |
This class is responsible for creating the appropriate TTS engine based on | |
availability and configuration. | |
""" | |
def create_engine(engine_type: Optional[str] = None, lang_code: str = 'z') -> TTSEngineBase: | |
"""Create a TTS engine instance | |
Args: | |
engine_type (str, optional): Type of engine to create ('kokoro', 'kokoro_space', 'dia', 'dummy') | |
If None, the best available engine will be used | |
lang_code (str): Language code for the engine | |
Returns: | |
TTSEngineBase: An instance of a TTS engine | |
""" | |
from utils.tts_engines import get_available_engines, create_engine | |
# Get available engines | |
available_engines = get_available_engines() | |
logger.info(f"Available TTS engines: {available_engines}") | |
# If engine_type is specified, try to create that specific engine | |
if engine_type is not None: | |
if engine_type in available_engines: | |
logger.info(f"Creating requested engine: {engine_type}") | |
return create_engine(engine_type, lang_code) | |
else: | |
logger.warning(f"Requested engine '{engine_type}' is not available") | |
# Try to create the best available engine | |
# Priority: kokoro > kokoro_space > dia > dummy | |
for engine in ['kokoro', 'kokoro_space', 'dia']: | |
if engine in available_engines: | |
logger.info(f"Creating best available engine: {engine}") | |
return create_engine(engine, lang_code) | |
# Fall back to dummy engine | |
logger.warning("No TTS engines available, falling back to dummy engine") | |
return DummyTTSEngine(lang_code) | |
# Backward compatibility function | |
def get_tts_engine(lang_code: str = 'a') -> TTSEngineBase: | |
"""Get or create TTS engine instance (backward compatibility function) | |
Args: | |
lang_code (str): Language code for the pipeline | |
Returns: | |
TTSEngineBase: Initialized TTS engine instance | |
""" | |
logger.info(f"Requesting TTS engine with language code: {lang_code}") | |
try: | |
import streamlit as st | |
logger.info("Streamlit detected, using cached TTS engine") | |
def _get_engine(): | |
logger.info("Creating cached TTS engine instance") | |
engine = TTSFactory.create_engine(lang_code=lang_code) | |
logger.info(f"Cached TTS engine created with type: {engine.__class__.__name__}") | |
return engine | |
engine = _get_engine() | |
logger.info(f"Retrieved TTS engine from cache with type: {engine.__class__.__name__}") | |
return engine | |
except ImportError: | |
logger.info("Streamlit not available, creating direct TTS engine instance") | |
engine = TTSFactory.create_engine(lang_code=lang_code) | |
logger.info(f"Direct TTS engine created with type: {engine.__class__.__name__}") | |
return engine | |
# Backward compatibility function | |
def generate_speech(text: str, voice: str = 'af_heart', speed: float = 1.0) -> str: | |
"""Public interface for TTS generation (backward compatibility function) | |
Args: | |
text (str): Input text to synthesize | |
voice (str): Voice ID to use | |
speed (float): Speech speed multiplier | |
Returns: | |
str: Path to generated audio file | |
""" | |
logger.info(f"Public generate_speech called with text length: {len(text)}, voice: {voice}, speed: {speed}") | |
try: | |
# Get the TTS engine | |
logger.info("Getting TTS engine instance") | |
engine = get_tts_engine() | |
logger.info(f"Using TTS engine type: {engine.__class__.__name__}") | |
# Generate speech | |
logger.info("Calling engine.generate_speech") | |
output_path = engine.generate_speech(text, voice, speed) | |
logger.info(f"Speech generation complete, output path: {output_path}") | |
return output_path | |
except Exception as e: | |
logger.error(f"Error in public generate_speech function: {str(e)}", exc_info=True) | |
logger.error(f"Error type: {type(e).__name__}") | |
if hasattr(e, '__traceback__'): | |
tb = e.__traceback__ | |
while tb.tb_next: | |
tb = tb.tb_next | |
logger.error(f"Error occurred in file: {tb.tb_frame.f_code.co_filename}, line {tb.tb_lineno}") | |
raise |