Spaces:

lalalic
/

xtts

Sleeping

lalalic committed on Mar 27, 2024

Commit

bc1d7a3

verified ·

1 Parent(s): ababc28

Update xtts.py

Files changed (1) hide show

xtts.py CHANGED Viewed

@@ -30,24 +30,10 @@ if not os.path.exists(sample_root):
     os.makedirs(sample_root)
 default_sample=f'{os.path.dirname(os.path.abspath(__file__))}/sample.wav', f'{sample_root}/sample.pt'
 ffmpeg=f'{os.path.dirname(os.path.abspath(__file__))}/ffmpeg'
-try:
-    st = os.stat(ffmpeg)
-    os.chmod(ffmpeg, st.st_mode | stat.S_IEXEC)
-except:
-    traceback.print_exc()
 tts=None
 model=None
-model_name="tts_models/multilingual/multi-dataset/xtts_v2"
-try:
-    tts = TTS(model_name=model_name)
-    model=tts.synthesizer.tts_model
-except:
-    traceback.print_exc()
 @app.route("/convert")
 def predict():
     global tts
@@ -66,12 +52,13 @@ def predict():
         if tts is None:
             TTS=import_module("TTS.api").TTS
             model_name="tts_models/multilingual/multi-dataset/xtts_v2"
-            tts = TTS(model_name=model_name)
             model=tts.synthesizer.tts_model
-        if not hasattr(model, '__get_conditioning_latents'):
             #hack to use cache
             model.__get_conditioning_latents=model.get_conditioning_latents
             model.get_conditioning_latents=get_conditioning_latents
         wav = tts.tts(
             text,

     os.makedirs(sample_root)
 default_sample=f'{os.path.dirname(os.path.abspath(__file__))}/sample.wav', f'{sample_root}/sample.pt'
 ffmpeg=f'{os.path.dirname(os.path.abspath(__file__))}/ffmpeg'
 tts=None
 model=None
 @app.route("/convert")
 def predict():
     global tts
         if tts is None:
             TTS=import_module("TTS.api").TTS
             model_name="tts_models/multilingual/multi-dataset/xtts_v2"
+            print(f"loading model {model_name} ...")
+            tts = TTS(model_name=model_name, progress_bar=False)
             model=tts.synthesizer.tts_model
             #hack to use cache
             model.__get_conditioning_latents=model.get_conditioning_latents
             model.get_conditioning_latents=get_conditioning_latents
+            print("model is ready")
         wav = tts.tts(
             text,