PoTaTo721 committed on
Commit
1c46b88
1 Parent(s): f4fbddd

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +8 -8
app.py CHANGED
@@ -150,13 +150,13 @@ def create_demo():
150
  notes = gr.Markdown(
151
  """
152
  # Fish Agent
153
- 1. 此Demo为Fish Audio自研端到端语言模型Fish Agent 3B版本.
154
- 2. 你可以在我们的官方仓库找到代码以及权重,但是相关内容全部基于 CC BY-NC-SA 4.0 许可证发布.
155
- 3. Demo为早期灰度测试版本,推理速度尚待优化.
156
- # 特色
157
- 1. 该模型自动集成ASRTTS部分,不需要外挂其它模型,即真正的端到端,而非三段式(ASR+LLM+TTS).
158
- 2. 模型可以使用reference audio控制说话音色.
159
- 3. 可以生成具有较强情感与韵律的音频.
160
  """
161
  )
162
 
@@ -169,7 +169,7 @@ def create_demo():
169
  )
170
  sys_text_input = gr.Textbox(
171
  label="What is your assistant's role?",
172
- value='您是由 Fish Audio 设计的语音助手,提供端到端的语音交互,实现无缝用户体验。首先转录用户的语音,然后使用以下格式回答:"Question: [用户语音]\n\nResponse: [你的回答]\n"。',
173
  type="text",
174
  )
175
  audio_input = gr.Audio(
 
150
  notes = gr.Markdown(
151
  """
152
  # Fish Agent
153
+ 1. This demo is the Fish Audio self-developed end-to-end language model Fish Agent 3B version.
154
+ 2. You can find the code and weights in our official repository, but all related content is released under the CC BY-NC-SA 4.0 license.
155
+ 3. The demo is an early beta version, and inference speed is yet to be optimized.
156
+ # Features
157
+ 1. This model automatically integrates ASR and TTS components, requiring no external models, making it truly end-to-end rather than a three-stage process (ASR+LLM+TTS).
158
+ 2. The model can use reference audio to control speaking voice.
159
+ 3. It can generate audio with strong emotions and prosody.
160
  """
161
  )
162
 
 
169
  )
170
  sys_text_input = gr.Textbox(
171
  label="What is your assistant's role?",
172
+ value='You are a voice assistant created by Fish Audio, offering end-to-end voice interaction for a seamless user experience. You are required to first transcribe the user's speech, then answer it in the following format: "Question: [USER_SPEECH]\n\nResponse: [YOUR_RESPONSE]\n"。You are required to use the following voice in this conversation.',
173
  type="text",
174
  )
175
  audio_input = gr.Audio(