Spaces:
Configuration error
Configuration error
Merge branch 'main' of https://github.com/SWivid/F5-TTS
Browse files
- gradio_app.py +1 -2
- inference-cli.py +1 -2
gradio_app.py
CHANGED
@@ -46,6 +46,7 @@ pipe = pipeline(
|
|
46 |
torch_dtype=torch.float16,
|
47 |
device=device,
|
48 |
)
|
|
|
49 |
|
50 |
# --------------------- Settings -------------------- #
|
51 |
|
@@ -243,8 +244,6 @@ def infer_batch(ref_audio, ref_text, gen_text_batches, exp_name, remove_silence,
|
|
243 |
|
244 |
generated = generated[:, ref_audio_len:, :]
|
245 |
generated_mel_spec = rearrange(generated, "1 n d -> 1 d n")
|
246 |
-
|
247 |
-
vocos = Vocos.from_pretrained("charactr/vocos-mel-24khz")
|
248 |
generated_wave = vocos.decode(generated_mel_spec.cpu())
|
249 |
if rms < target_rms:
|
250 |
generated_wave = generated_wave * rms / target_rms
|
|
|
46 |
torch_dtype=torch.float16,
|
47 |
device=device,
|
48 |
)
|
49 |
+
vocos = Vocos.from_pretrained("charactr/vocos-mel-24khz")
|
50 |
|
51 |
# --------------------- Settings -------------------- #
|
52 |
|
|
|
244 |
|
245 |
generated = generated[:, ref_audio_len:, :]
|
246 |
generated_mel_spec = rearrange(generated, "1 n d -> 1 d n")
|
|
|
|
|
247 |
generated_wave = vocos.decode(generated_mel_spec.cpu())
|
248 |
if rms < target_rms:
|
249 |
generated_wave = generated_wave * rms / target_rms
|
inference-cli.py
CHANGED
@@ -95,6 +95,7 @@ device = (
|
|
95 |
if torch.cuda.is_available()
|
96 |
else "mps" if torch.backends.mps.is_available() else "cpu"
|
97 |
)
|
|
|
98 |
|
99 |
print(f"Using {device} device")
|
100 |
|
@@ -286,8 +287,6 @@ def infer_batch(ref_audio, ref_text, gen_text_batches, model, remove_silence):
|
|
286 |
|
287 |
generated = generated[:, ref_audio_len:, :]
|
288 |
generated_mel_spec = rearrange(generated, "1 n d -> 1 d n")
|
289 |
-
|
290 |
-
vocos = Vocos.from_pretrained("charactr/vocos-mel-24khz")
|
291 |
generated_wave = vocos.decode(generated_mel_spec.cpu())
|
292 |
if rms < target_rms:
|
293 |
generated_wave = generated_wave * rms / target_rms
|
|
|
95 |
if torch.cuda.is_available()
|
96 |
else "mps" if torch.backends.mps.is_available() else "cpu"
|
97 |
)
|
98 |
+
vocos = Vocos.from_pretrained("charactr/vocos-mel-24khz")
|
99 |
|
100 |
print(f"Using {device} device")
|
101 |
|
|
|
287 |
|
288 |
generated = generated[:, ref_audio_len:, :]
|
289 |
generated_mel_spec = rearrange(generated, "1 n d -> 1 d n")
|
|
|
|
|
290 |
generated_wave = vocos.decode(generated_mel_spec.cpu())
|
291 |
if rms < target_rms:
|
292 |
generated_wave = generated_wave * rms / target_rms
|