SWivid committed on
Commit
4a69e6b
·
1 Parent(s): 8718b1d

formatting

Browse files
Files changed (1) hide show
  1. src/f5_tts/infer/utils_infer.py +2 -1
src/f5_tts/infer/utils_infer.py CHANGED
@@ -221,7 +221,7 @@ def load_model(
221
  def remove_silence_edges(audio, silence_threshold=-42):
222
  # Remove silence from the start
223
  non_silent_start_idx = silence.detect_leading_silence(audio, silence_threshold=silence_threshold)
224
- audio = audio[non_silent_start_idx :]
225
 
226
  # Remove silence from the end
227
  non_silent_end_duration = audio.duration_seconds
@@ -272,6 +272,7 @@ def preprocess_ref_audio_text(ref_audio_orig, ref_text, clip_short=True, show_in
272
  if len(aseg) > 15000:
273
  aseg = aseg[:15000]
274
  show_info("Audio is over 15s, clipping short. (3)")
 
275
  aseg = remove_silence_edges(aseg) + AudioSegment.silent(duration=50)
276
  aseg.export(f.name, format="wav")
277
  ref_audio = f.name
 
221
  def remove_silence_edges(audio, silence_threshold=-42):
222
  # Remove silence from the start
223
  non_silent_start_idx = silence.detect_leading_silence(audio, silence_threshold=silence_threshold)
224
+ audio = audio[non_silent_start_idx:]
225
 
226
  # Remove silence from the end
227
  non_silent_end_duration = audio.duration_seconds
 
272
  if len(aseg) > 15000:
273
  aseg = aseg[:15000]
274
  show_info("Audio is over 15s, clipping short. (3)")
275
+
276
  aseg = remove_silence_edges(aseg) + AudioSegment.silent(duration=50)
277
  aseg.export(f.name, format="wav")
278
  ref_audio = f.name