kevinwang676 committed on
Commit
605cc0d
·
1 Parent(s): 7439dde

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +16 -15
app.py CHANGED
@@ -255,13 +255,14 @@ speakers_list.insert(0, "nana.npz")
255
 
256
  # Create Gradio Blocks
257
 
258
- with gr.Blocks(title="Bark Enhanced Gradio GUI", mode="Bark Enhanced") as barkgui:
259
- gr.Markdown("### [Bark Enhanced v0.4.0](https://github.com/C0untFloyd/bark-gui)")
260
- with gr.Tab("TTS"):
 
261
  with gr.Row():
262
  with gr.Column():
263
- placeholder = "Enter text here."
264
- input_text = gr.Textbox(label="Input Text", lines=4, placeholder=placeholder)
265
  with gr.Column():
266
  convert_to_ssml_button = gr.Button("Convert Text to SSML", visible=False)
267
  with gr.Row():
@@ -290,15 +291,15 @@ with gr.Blocks(title="Bark Enhanced Gradio GUI", mode="Bark Enhanced") as barkgu
290
 
291
  with gr.Row():
292
  with gr.Column():
293
- gr.Markdown("[Voice Prompt Library](https://suno-ai.notion.site/8b8e8749ed514b0cbf3f699013548683?v=bc67cff786b04b50b3ceb756fd05f68c)")
294
- speaker = gr.Dropdown(speakers_list, value=speakers_list[0], label="Voice")
295
  with gr.Column():
296
  text_temp = gr.Slider(0.1, 1.0, value=0.7, label="Generation Temperature", info="1.0 more diverse, 0.1 more conservative")
297
  waveform_temp = gr.Slider(0.1, 1.0, value=0.7, label="Waveform temperature", info="1.0 more diverse, 0.1 more conservative")
298
 
299
  with gr.Row():
300
  with gr.Column():
301
- quick_gen_checkbox = gr.Checkbox(label="Quick Generation", value=True)
302
  with gr.Column():
303
  settings_checkboxes = ["Use semantic history", "Use coarse history", "Use fine history", "Use last generation as history"]
304
  complete_settings = gr.CheckboxGroup(choices=settings_checkboxes, value=settings_checkboxes, label="Detailed Generation Settings", type="value", interactive=True, visible=False)
@@ -306,22 +307,22 @@ with gr.Blocks(title="Bark Enhanced Gradio GUI", mode="Bark Enhanced") as barkgu
306
 
307
  with gr.Row():
308
  with gr.Column():
309
- tts_create_button = gr.Button("Generate")
310
  with gr.Column():
311
  hidden_checkbox = gr.Checkbox(visible=False)
312
  button_delete_files = gr.Button("Clear output folder", visible=False)
313
  with gr.Row():
314
- output_audio = gr.Audio(label="Generated Audio", type="filepath")
315
 
316
- with gr.Tab("Clone Voice"):
317
  input_audio_filename = gr.Audio(label="Input audio.wav", source="upload", type="filepath")
318
  transcription_text = gr.Textbox(label="Transcription Text", lines=1, placeholder="Enter Text of your Audio Sample here...")
319
  initialname = "Custom_voice"
320
  #inputAudioFilename = gr.Textbox(label="Filename of Input Audio", lines=1, placeholder="audio.wav")
321
- output_voice = gr.Textbox(label="Filename of trained Voice", lines=1, placeholder=initialname, value=initialname)
322
- clone_voice_button = gr.Button("Create Voice")
323
- dummy = gr.Text(label="Progress")
324
- npz_file_1 = gr.File(label=".npz file")
325
 
326
  convert_to_ssml_button.click(convert_text_to_ssml, inputs=[input_text, speaker],outputs=input_text)
327
  tts_create_button.click(generate_text_to_speech, inputs=[input_text, speaker, text_temp, waveform_temp, quick_gen_checkbox, complete_settings],outputs=output_audio)
 
255
 
256
  # Create Gradio Blocks
257
 
258
+ with gr.Blocks(title="🐶🥳🎶 - Bark声音合成,开启声音真实复刻的新纪元!", mode="Bark Enhanced") as barkgui:
259
+ gr.Markdown("### <center>🦄 - [Bark](https://github.com/suno-ai/bark)拟声,能够实现语音、语调及说话情感的真实复刻</center>")
260
+ gr.Markdown("### <center>Powered by [Bark Enhanced v0.4.0](https://github.com/C0untFloyd/bark-gui). Thanks to C0untFloyd.</center>")
261
+ with gr.Tab("🐶 - Bark拟声"):
262
  with gr.Row():
263
  with gr.Column():
264
+ placeholder = "想让Bark说些什么呢?"
265
+ input_text = gr.Textbox(label="用作声音合成的文本", lines=4, placeholder=placeholder)
266
  with gr.Column():
267
  convert_to_ssml_button = gr.Button("Convert Text to SSML", visible=False)
268
  with gr.Row():
 
291
 
292
  with gr.Row():
293
  with gr.Column():
294
+ gr.Markdown("查看Bark官方的[语言库](https://suno-ai.notion.site/8b8e8749ed514b0cbf3f699013548683?v=bc67cff786b04b50b3ceb756fd05f68c)")
295
+ speaker = gr.Dropdown(speakers_list, value=speakers_list[0], label="中英双语的不同声音供您选择")
296
  with gr.Column():
297
  text_temp = gr.Slider(0.1, 1.0, value=0.7, label="Generation Temperature", info="1.0 more diverse, 0.1 more conservative")
298
  waveform_temp = gr.Slider(0.1, 1.0, value=0.7, label="Waveform temperature", info="1.0 more diverse, 0.1 more conservative")
299
 
300
  with gr.Row():
301
  with gr.Column():
302
+ quick_gen_checkbox = gr.Checkbox(label="是否要快速合成语音", value=True)
303
  with gr.Column():
304
  settings_checkboxes = ["Use semantic history", "Use coarse history", "Use fine history", "Use last generation as history"]
305
  complete_settings = gr.CheckboxGroup(choices=settings_checkboxes, value=settings_checkboxes, label="Detailed Generation Settings", type="value", interactive=True, visible=False)
 
307
 
308
  with gr.Row():
309
  with gr.Column():
310
+ tts_create_button = gr.Button("开始生成语音吧")
311
  with gr.Column():
312
  hidden_checkbox = gr.Checkbox(visible=False)
313
  button_delete_files = gr.Button("Clear output folder", visible=False)
314
  with gr.Row():
315
+ output_audio = gr.Audio(label="听听Bark为您复刻的语音吧", type="filepath")
316
 
317
+ with gr.Tab("🎶 - 声音克隆"):
318
  input_audio_filename = gr.Audio(label="Input audio.wav", source="upload", type="filepath")
319
  transcription_text = gr.Textbox(label="Transcription Text", lines=1, placeholder="Enter Text of your Audio Sample here...")
320
  initialname = "Custom_voice"
321
  #inputAudioFilename = gr.Textbox(label="Filename of Input Audio", lines=1, placeholder="audio.wav")
322
+ output_voice = gr.Textbox(label="为您的专属声音起个名字吧", lines=1, placeholder=initialname, value=initialname)
323
+ clone_voice_button = gr.Button("生成.npz文件")
324
+ dummy = gr.Text(label="进度")
325
+ npz_file_1 = gr.File(label="请下载您的专属.npz文件")
326
 
327
  convert_to_ssml_button.click(convert_text_to_ssml, inputs=[input_text, speaker],outputs=input_text)
328
  tts_create_button.click(generate_text_to_speech, inputs=[input_text, speaker, text_temp, waveform_temp, quick_gen_checkbox, complete_settings],outputs=output_audio)