TaiYouWeb committed on
Commit
6b28214
·
verified ·
1 Parent(s): 50b0eff

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -1
app.py CHANGED
@@ -26,6 +26,7 @@ model = AutoModel(
26
  trust_remote_code=False,
27
  remote_code="./model.py",
28
  vad_model="fsmn-vad",
 
29
  spk_model="cam++",
30
  vad_kwargs={"max_single_segment_time": 15000},
31
  ncpu=torch.get_num_threads(),
@@ -34,7 +35,7 @@ model = AutoModel(
34
  device=device,
35
  )
36
 
37
- def transcribe_audio(file_path, vad_model="fsmn-vad", spk_model="cam++", vad_kwargs='{"max_single_segment_time": 15000}',
38
  batch_size=1, language="auto", use_itn=True, batch_size_s=60,
39
  merge_vad=True, merge_length_s=15, batch_size_threshold_s=50,
40
  hotword=" ", ban_emo_unk=True):
@@ -66,6 +67,7 @@ def transcribe_audio(file_path, vad_model="fsmn-vad", spk_model="cam++", vad_kwa
66
  inputs = [
67
  gr.Audio(type="filepath"),
68
  gr.Textbox(value="fsmn-vad", label="VAD Model"),
 
69
  gr.Textbox(value="cam++", label="SPK Model"),
70
  gr.Textbox(value='{"max_single_segment_time": 15000}', label="VAD Kwargs"),
71
  gr.Slider(1, 10, value=1, step=1, label="Batch Size"),
 
26
  trust_remote_code=False,
27
  remote_code="./model.py",
28
  vad_model="fsmn-vad",
29
+ punc_model="iic/speech_paraformer-large-vad-punc_asr_nat-zh-cn-16k-common-vocab8404-pytorch",
30
  spk_model="cam++",
31
  vad_kwargs={"max_single_segment_time": 15000},
32
  ncpu=torch.get_num_threads(),
 
35
  device=device,
36
  )
37
 
38
+ def transcribe_audio(file_path, vad_model="fsmn-vad", punc_model="ct-punc", spk_model="cam++", vad_kwargs='{"max_single_segment_time": 15000}',
39
  batch_size=1, language="auto", use_itn=True, batch_size_s=60,
40
  merge_vad=True, merge_length_s=15, batch_size_threshold_s=50,
41
  hotword=" ", ban_emo_unk=True):
 
67
  inputs = [
68
  gr.Audio(type="filepath"),
69
  gr.Textbox(value="fsmn-vad", label="VAD Model"),
70
+ gr.Textbox(value="iic/speech_paraformer-large-vad-punc_asr_nat-zh-cn-16k-common-vocab8404-pytorch", label="PUNC Model"),
71
  gr.Textbox(value="cam++", label="SPK Model"),
72
  gr.Textbox(value='{"max_single_segment_time": 15000}', label="VAD Kwargs"),
73
  gr.Slider(1, 10, value=1, step=1, label="Batch Size"),