Fix handling of models < 1.0
Browse files
app.py
CHANGED
@@ -8,6 +8,9 @@ import hashlib
|
|
8 |
import os
|
9 |
from functools import lru_cache
|
10 |
from typing import Optional
|
|
|
|
|
|
|
11 |
|
12 |
# Available OuteTTS models based on the documentation
|
13 |
MODELS = {v.value: v for _, v in outetts.Models.__members__.items()}
|
@@ -23,17 +26,48 @@ def get_file_hash(file_path):
|
|
23 |
hash_md5.update(chunk)
|
24 |
return hash_md5.hexdigest()
|
25 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
26 |
@lru_cache(maxsize=5)
|
27 |
def get_cached_interface(model_name: str):
|
28 |
"""Get cached interface instance for the model."""
|
29 |
model = MODELS[model_name]
|
30 |
-
|
31 |
-
|
32 |
-
|
33 |
-
model
|
34 |
-
|
35 |
-
|
36 |
-
|
|
|
|
|
|
|
|
|
37 |
|
38 |
# Initialize the interface
|
39 |
interface = outetts.Interface(config=config)
|
@@ -84,7 +118,8 @@ def create_speaker_and_generate(model_name, audio_file, test_text: Optional[str]
|
|
84 |
speaker=speaker,
|
85 |
sampler_config=outetts.SamplerConfig(
|
86 |
temperature=temperature
|
87 |
-
)
|
|
|
88 |
)
|
89 |
)
|
90 |
|
|
|
8 |
import os
|
9 |
from functools import lru_cache
|
10 |
from typing import Optional
|
11 |
+
from outetts.models.info import MODEL_INFO
|
12 |
+
from outetts.utils import helpers
|
13 |
+
from huggingface_hub import hf_hub_download
|
14 |
|
15 |
# Available OuteTTS models based on the documentation
|
16 |
MODELS = {v.value: v for _, v in outetts.Models.__members__.items()}
|
|
|
26 |
hash_md5.update(chunk)
|
27 |
return hash_md5.hexdigest()
|
28 |
|
29 |
+
def try_auto_model_config(model: outetts.Models, backend: outetts.Backend, quantization: outetts.LlamaCppQuantization):
    """Try to build a ModelConfig backed by a quantized GGUF checkpoint.

    Downloads the requested *quantization* of *model* from the
    ``OuteAI/<model>-GGUF`` repo on the Hugging Face Hub and wraps it in an
    ``outetts.ModelConfig``.

    Returns:
        The constructed ``outetts.ModelConfig``, or ``None`` when the
        download or config construction fails — callers use ``None`` as the
        signal to fall back to the plain (non-GGUF) HF model.
    """
    # Per-model metadata from the library, expanded into the config below.
    # NOTE(review): assumes MODEL_INFO[model] is a mapping of ModelConfig
    # keyword arguments — confirm against outetts.models.info.
    model_config = MODEL_INFO[model]
    try:
        repo = f"OuteAI/{model.value}-GGUF"
        filename = f"{model.value}-{quantization.value}.gguf"
        model_path = hf_hub_download(
            repo_id=repo,
            filename=filename,
            local_dir=os.path.join(helpers.get_cache_dir(), "gguf"),
            local_files_only=False,  # allow fetching when not cached yet
        )
        return outetts.ModelConfig(
            model_path=model_path,
            tokenizer_path=f"OuteAI/{model.value}",
            backend=backend,
            n_gpu_layers=99,  # offload (effectively) all layers when a GPU is available
            verbose=False,
            device=None,
            dtype=None,
            additional_model_config={},
            audio_codec_path=None,
            **model_config,
        )
    except Exception as e:
        # Best-effort: any failure (network, missing quantization file,
        # bad metadata) is reported and the caller falls back to HF.
        print(f"Error: {e}")
        return None
|
55 |
+
|
56 |
@lru_cache(maxsize=5)
|
57 |
def get_cached_interface(model_name: str):
|
58 |
"""Get cached interface instance for the model."""
|
59 |
model = MODELS[model_name]
|
60 |
+
|
61 |
+
config = try_auto_model_config(model, outetts.Backend.LLAMACPP, outetts.LlamaCppQuantization.Q6_K)
|
62 |
+
if not config:
|
63 |
+
# Fallback to HF model
|
64 |
+
model_config = MODEL_INFO[model]
|
65 |
+
config = outetts.ModelConfig(
|
66 |
+
model_path=f"OuteAI/{model_name}",
|
67 |
+
tokenizer_path=f"OuteAI/{model_name}",
|
68 |
+
backend=outetts.Backend.HF,
|
69 |
+
**model_config
|
70 |
+
)
|
71 |
|
72 |
# Initialize the interface
|
73 |
interface = outetts.Interface(config=config)
|
|
|
118 |
speaker=speaker,
|
119 |
sampler_config=outetts.SamplerConfig(
|
120 |
temperature=temperature
|
121 |
+
),
|
122 |
+
max_length=MODEL_INFO[MODELS[model_name]]["max_seq_length"]
|
123 |
)
|
124 |
)
|
125 |
|