AWAS666 committed on
Commit
664533a
·
2 Parent(s): ff4e797 f2b892a

Merge branch 'main' of https://github.com/SWivid/F5-TTS

Browse files
Files changed (2) hide show
  1. gradio_app.py +1 -2
  2. inference-cli.py +1 -2
gradio_app.py CHANGED
@@ -46,6 +46,7 @@ pipe = pipeline(
46
  torch_dtype=torch.float16,
47
  device=device,
48
  )
 
49
 
50
  # --------------------- Settings -------------------- #
51
 
@@ -243,8 +244,6 @@ def infer_batch(ref_audio, ref_text, gen_text_batches, exp_name, remove_silence,
243
 
244
  generated = generated[:, ref_audio_len:, :]
245
  generated_mel_spec = rearrange(generated, "1 n d -> 1 d n")
246
-
247
- vocos = Vocos.from_pretrained("charactr/vocos-mel-24khz")
248
  generated_wave = vocos.decode(generated_mel_spec.cpu())
249
  if rms < target_rms:
250
  generated_wave = generated_wave * rms / target_rms
 
46
  torch_dtype=torch.float16,
47
  device=device,
48
  )
49
+ vocos = Vocos.from_pretrained("charactr/vocos-mel-24khz")
50
 
51
  # --------------------- Settings -------------------- #
52
 
 
244
 
245
  generated = generated[:, ref_audio_len:, :]
246
  generated_mel_spec = rearrange(generated, "1 n d -> 1 d n")
 
 
247
  generated_wave = vocos.decode(generated_mel_spec.cpu())
248
  if rms < target_rms:
249
  generated_wave = generated_wave * rms / target_rms
inference-cli.py CHANGED
@@ -95,6 +95,7 @@ device = (
95
  if torch.cuda.is_available()
96
  else "mps" if torch.backends.mps.is_available() else "cpu"
97
  )
 
98
 
99
  print(f"Using {device} device")
100
 
@@ -286,8 +287,6 @@ def infer_batch(ref_audio, ref_text, gen_text_batches, model, remove_silence):
286
 
287
  generated = generated[:, ref_audio_len:, :]
288
  generated_mel_spec = rearrange(generated, "1 n d -> 1 d n")
289
-
290
- vocos = Vocos.from_pretrained("charactr/vocos-mel-24khz")
291
  generated_wave = vocos.decode(generated_mel_spec.cpu())
292
  if rms < target_rms:
293
  generated_wave = generated_wave * rms / target_rms
 
95
  if torch.cuda.is_available()
96
  else "mps" if torch.backends.mps.is_available() else "cpu"
97
  )
98
+ vocos = Vocos.from_pretrained("charactr/vocos-mel-24khz")
99
 
100
  print(f"Using {device} device")
101
 
 
287
 
288
  generated = generated[:, ref_audio_len:, :]
289
  generated_mel_spec = rearrange(generated, "1 n d -> 1 d n")
 
 
290
  generated_wave = vocos.decode(generated_mel_spec.cpu())
291
  if rms < target_rms:
292
  generated_wave = generated_wave * rms / target_rms