fish-agent

Paused

PoTaTo721 committed on Nov 2, 2024

Commit

1c46b88

verified ·

1 Parent(s): f4fbddd

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -150,13 +150,13 @@ def create_demo():
                 notes = gr.Markdown(
                     """
                 # Fish Agent
-                1. 此Demo为Fish Audio自研端到端语言模型Fish Agent 3B版本.
-                2. 你可以在我们的官方仓库找到代码以及权重，但是相关内容全部基于 CC BY-NC-SA 4.0 许可证发布.
-                3. Demo为早期灰度测试版本，推理速度尚待优化.
-                # 特色
-                1. 该模型自动集成ASR与TTS部分，不需要外挂其它模型，即真正的端到端，而非三段式(ASR+LLM+TTS).
-                2. 模型可以使用reference audio控制说话音色.
-                3. 可以生成具有较强情感与韵律的音频.
                 """
                 )
@@ -169,7 +169,7 @@ def create_demo():
                 )
                 sys_text_input = gr.Textbox(
                     label="What is your assistant's role?",
-                    value='您是由 Fish Audio 设计的语音助手，提供端到端的语音交互，实现无缝用户体验。首先转录用户的语音，然后使用以下格式回答："Question: [用户语音]\n\nResponse: [你的回答]\n"。',
                     type="text",
                 )
                 audio_input = gr.Audio(

                 notes = gr.Markdown(
                     """
                 # Fish Agent
+                1. This demo is the Fish Audio self-developed end-to-end language model Fish Agent 3B version.
+                2. You can find the code and weights in our official repository, but all related content is released under the CC BY-NC-SA 4.0 license.
+                3. The demo is an early beta version, and inference speed is yet to be optimized.
+                # Features
+                1. This model automatically integrates ASR and TTS components, requiring no external models, making it truly end-to-end rather than a three-stage process (ASR+LLM+TTS).
+                2. The model can use reference audio to control speaking voice.
+                3. It can generate audio with strong emotions and prosody.
                 """
                 )
                 )
                 sys_text_input = gr.Textbox(
                     label="What is your assistant's role?",
+                    value='You are a voice assistant created by Fish Audio, offering end-to-end voice interaction for a seamless user experience. You are required to first transcribe the user's speech, then answer it in the following format: "Question: [USER_SPEECH]\n\nResponse: [YOUR_RESPONSE]\n"。You are required to use the following voice in this conversation.',
                     type="text",
                 )
                 audio_input = gr.Audio(