Spaces:
Configuration error
Configuration error
unknown
committed on
Commit
·
3dd59b8
1
Parent(s):
02d5913
When ref_text is empty, transcribe the reference audio automatically
Browse files
- src/f5_tts/api.py +9 -4
src/f5_tts/api.py
CHANGED
@@ -15,6 +15,9 @@ from f5_tts.infer.utils_infer import (
|
|
15 |
infer_process,
|
16 |
remove_silence_for_generated_wav,
|
17 |
save_spectrogram,
|
|
|
|
|
|
|
18 |
)
|
19 |
|
20 |
|
@@ -31,10 +34,8 @@ class F5TTS:
|
|
31 |
):
|
32 |
# Initialize parameters
|
33 |
self.final_wave = None
|
34 |
-
self.target_sample_rate =
|
35 |
-
self.
|
36 |
-
self.hop_length = 256
|
37 |
-
self.target_rms = 0.1
|
38 |
self.seed = -1
|
39 |
|
40 |
# Set device
|
@@ -97,6 +98,10 @@ class F5TTS:
|
|
97 |
seed = random.randint(0, sys.maxsize)
|
98 |
seed_everything(seed)
|
99 |
self.seed = seed
|
|
|
|
|
|
|
|
|
100 |
wav, sr, spect = infer_process(
|
101 |
ref_file,
|
102 |
ref_text,
|
|
|
15 |
infer_process,
|
16 |
remove_silence_for_generated_wav,
|
17 |
save_spectrogram,
|
18 |
+
preprocess_ref_audio_text,
|
19 |
+
target_sample_rate,
|
20 |
+
hop_length,
|
21 |
)
|
22 |
|
23 |
|
|
|
34 |
):
|
35 |
# Initialize parameters
|
36 |
self.final_wave = None
|
37 |
+
self.target_sample_rate = target_sample_rate
|
38 |
+
self.hop_length = hop_length
|
|
|
|
|
39 |
self.seed = -1
|
40 |
|
41 |
# Set device
|
|
|
98 |
seed = random.randint(0, sys.maxsize)
|
99 |
seed_everything(seed)
|
100 |
self.seed = seed
|
101 |
+
|
102 |
+
if ref_text == "":
|
103 |
+
ref_file, ref_text = preprocess_ref_audio_text(ref_file, ref_text, device=self.device)
|
104 |
+
|
105 |
wav, sr, spect = infer_process(
|
106 |
ref_file,
|
107 |
ref_text,
|