Spaces:
Configuration error
Configuration error
formatting
Browse files
src/f5_tts/infer/utils_infer.py
CHANGED
@@ -221,7 +221,7 @@ def load_model(
|
|
221 |
def remove_silence_edges(audio, silence_threshold=-42):
|
222 |
# Remove silence from the start
|
223 |
non_silent_start_idx = silence.detect_leading_silence(audio, silence_threshold=silence_threshold)
|
224 |
-
audio = audio[non_silent_start_idx
|
225 |
|
226 |
# Remove silence from the end
|
227 |
non_silent_end_duration = audio.duration_seconds
|
@@ -272,6 +272,7 @@ def preprocess_ref_audio_text(ref_audio_orig, ref_text, clip_short=True, show_in
|
|
272 |
if len(aseg) > 15000:
|
273 |
aseg = aseg[:15000]
|
274 |
show_info("Audio is over 15s, clipping short. (3)")
|
|
|
275 |
aseg = remove_silence_edges(aseg) + AudioSegment.silent(duration=50)
|
276 |
aseg.export(f.name, format="wav")
|
277 |
ref_audio = f.name
|
|
|
221 |
def remove_silence_edges(audio, silence_threshold=-42):
|
222 |
# Remove silence from the start
|
223 |
non_silent_start_idx = silence.detect_leading_silence(audio, silence_threshold=silence_threshold)
|
224 |
+
audio = audio[non_silent_start_idx:]
|
225 |
|
226 |
# Remove silence from the end
|
227 |
non_silent_end_duration = audio.duration_seconds
|
|
|
272 |
if len(aseg) > 15000:
|
273 |
aseg = aseg[:15000]
|
274 |
show_info("Audio is over 15s, clipping short. (3)")
|
275 |
+
|
276 |
aseg = remove_silence_edges(aseg) + AudioSegment.silent(duration=50)
|
277 |
aseg.export(f.name, format="wav")
|
278 |
ref_audio = f.name
|