Spaces:
Configuration error
Configuration error
unknown
committed on
Commit
·
e636d98
1
Parent(s):
96e24d3
add transcribe function
Browse files
- src/f5_tts/api.py +4 -0
src/f5_tts/api.py
CHANGED
@@ -15,6 +15,7 @@ from f5_tts.infer.utils_infer import (
|
|
15 |
preprocess_ref_audio_text,
|
16 |
remove_silence_for_generated_wav,
|
17 |
save_spectrogram,
|
|
|
18 |
target_sample_rate,
|
19 |
)
|
20 |
from f5_tts.model import DiT, UNetT
|
@@ -82,6 +83,9 @@ class F5TTS:
|
|
82 |
model_cls, model_cfg, ckpt_file, mel_spec_type, vocab_file, ode_method, use_ema, self.device
|
83 |
)
|
84 |
|
|
|
|
|
|
|
85 |
def export_wav(self, wav, file_wave, remove_silence=False):
|
86 |
sf.write(file_wave, wav, self.target_sample_rate)
|
87 |
|
|
|
15 |
preprocess_ref_audio_text,
|
16 |
remove_silence_for_generated_wav,
|
17 |
save_spectrogram,
|
18 |
+
transcribe,
|
19 |
target_sample_rate,
|
20 |
)
|
21 |
from f5_tts.model import DiT, UNetT
|
|
|
83 |
model_cls, model_cfg, ckpt_file, mel_spec_type, vocab_file, ode_method, use_ema, self.device
|
84 |
)
|
85 |
|
86 |
+
def transcribe(self, ref_audio, language=None):
|
87 |
+
return transcribe(ref_audio, language)
|
88 |
+
|
89 |
def export_wav(self, wav, file_wave, remove_silence=False):
|
90 |
sf.write(file_wave, wav, self.target_sample_rate)
|
91 |
|