CosyVoice-300M

Runtime error

App Files Files Community

wenmeng.zwm committed on Jul 26

Commit

4905c07

•

1 Parent(s): fa47fc6

Translate UI strings from Chinese to English

Browse files

Files changed (3) hide show

css/advanced.py +12 -11
css/custom.py +17 -16
css/preset.py +12 -9

css/advanced.py CHANGED Viewed

@@ -8,7 +8,7 @@ from css.utils import *
 # 高级语音生成
 def advanced():
-    sound_choices = ['中文女', '中文男', '日语男', '英文女', '英文男', '粤语女', '韩语女']
     def random_seed():
         return random.randint(1, 100000000)
@@ -18,7 +18,8 @@ def advanced():
                        _synthetic_input_textbox, _seed):
         print(_sound_radio, _speech_status_textbox, _synthetic_input_textbox, _seed)
         if _synthetic_input_textbox == '':
-            gr.Warning('合成文本为空，您是否忘记输入合成文本？')
             return (target_sr, default_data)
         set_all_random_seed(_seed)
         model = cosyvoice_instruct
@@ -29,27 +30,27 @@ def advanced():
     with gr.Column():
         sound_radio = gr.Radio(choices=sound_choices,
                                value=sound_choices[0],
-                               label="选择预置音色")
     with gr.Column():
-        speech_status_textbox = gr.Textbox(label="描述语音状态")
         gr.Examples(
-            label="示例控制文本",
             examples=[
                 ["Selene 'Moonshade', is a mysterious, elegant dancer with a connection to the night. Her movements are both mesmerizing and deadly. "],
                 ["A female speaker with normal pitch, slow speaking rate, and sad emotion."],
             ],
             inputs=[speech_status_textbox])
     with gr.Column():
-        synthetic_input_textbox = gr.Textbox(label="输入合成文本")
         gr.Examples(
-            label="示例文本",
             examples=example_tts_text,
             inputs=[synthetic_input_textbox])
-    with gr.Accordion(label="随机种子"):
         with gr.Row():
             with gr.Column(scale=1, min_width=180):
-                seed_button = gr.Button(value="\U0001F3B2 随机换一换",
                                         elem_classes="full-height")
             with gr.Column(scale=10):
                 seed = gr.Number(show_label=False,
@@ -57,10 +58,10 @@ def advanced():
                                  container=False,
                                  elem_classes="full-height")
     with gr.Column():
-        generate_button = gr.Button("生成音频", variant="primary", size="lg")
     with gr.Column():
-        output_audio = gr.Audio(label="合成音频")
     seed_button.click(fn=random_seed, outputs=[seed])
     generate_button.click(fn=generate_audio,

 # 高级语音生成
 def advanced():
+    sound_choices = ['Chinese Female', 'Chinese Male', 'Japanese Male', 'English Female', 'English Male', 'Cantonese Female', 'Korean Female']
     def random_seed():
         return random.randint(1, 100000000)
                        _synthetic_input_textbox, _seed):
         print(_sound_radio, _speech_status_textbox, _synthetic_input_textbox, _seed)
         if _synthetic_input_textbox == '':
+            #gr.Warning('合成文本为空，您是否忘记输入合成文本？')
+            gr.Warning('The synthesis text is empty, did you forget to input the synthesis text?')
             return (target_sr, default_data)
         set_all_random_seed(_seed)
         model = cosyvoice_instruct
     with gr.Column():
         sound_radio = gr.Radio(choices=sound_choices,
                                value=sound_choices[0],
+                               label="Select Preset Voice")
     with gr.Column():
+        speech_status_textbox = gr.Textbox(label="Describe Voice Status")
         gr.Examples(
+            label="Example of control text",
             examples=[
                 ["Selene 'Moonshade', is a mysterious, elegant dancer with a connection to the night. Her movements are both mesmerizing and deadly. "],
                 ["A female speaker with normal pitch, slow speaking rate, and sad emotion."],
             ],
             inputs=[speech_status_textbox])
     with gr.Column():
+        synthetic_input_textbox = gr.Textbox(label="Input Synthesis Text")
         gr.Examples(
+            label="example",
             examples=example_tts_text,
             inputs=[synthetic_input_textbox])
+    with gr.Accordion(label="Random Seed"):
         with gr.Row():
             with gr.Column(scale=1, min_width=180):
+                seed_button = gr.Button(value="\U0001F3B2 Shuffle Randomly",
                                         elem_classes="full-height")
             with gr.Column(scale=10):
                 seed = gr.Number(show_label=False,
                                  container=False,
                                  elem_classes="full-height")
     with gr.Column():
+        generate_button = gr.Button("Generate Audio", variant="primary", size="lg")
     with gr.Column():
+        output_audio = gr.Audio(label="Synthesize Audio")
     seed_button.click(fn=random_seed, outputs=[seed])
     generate_button.click(fn=generate_audio,

css/custom.py CHANGED Viewed

@@ -18,7 +18,8 @@ def custom():
         t1 = time.time()
         print(_recorded_audio, _prompt_input_textbox, _language_radio, _synthetic_input_textbox, _seed)
         if _synthetic_input_textbox == '':
-            gr.Warning('合成文本为空，您是否忘记输入合成文本？')
             return (target_sr, default_data)
         set_all_random_seed(_seed)
         if use_instruct(_synthetic_input_textbox):
@@ -45,33 +46,33 @@ def custom():
             with gr.Column(scale=1, min_width=400):
                 with gr.Group():
                     recorded_audio = gr.Audio(sources=['microphone'],
-                                              label="录制音频文件",
                                               type='filepath')
-                    gr.Text("请点击录制，并朗读右方文字（中文或英文）完成录入",
                             max_lines=1,
                             container=False,
                             interactive=False)
             with gr.Column(scale=10):
-                prompt_input_textbox = gr.Textbox(label="输入待录制文本")
                 gr.Examples(
-                    label="示例待录制文本",
                     examples=example_prompt_text,
                     inputs=[prompt_input_textbox])
     with gr.Column():
-        language_radio = gr.Radio(choices=[('同语种', 'same'), ('跨语种', 'cross')],
                                   value='same',
-                                  label="输入合成文本")
         synthetic_input_textbox = gr.Textbox(show_label=False)
         gr.Examples(
-            label="示例文本",
             examples=example_tts_text,
             inputs=[synthetic_input_textbox])
-    with gr.Accordion(label="随机种子"):
         with gr.Row():
             with gr.Column(scale=1, min_width=180):
-                seed_button = gr.Button(value="\U0001F3B2 随机换一换",
                                         elem_classes="full-height")
             with gr.Column(scale=10):
                 seed = gr.Number(show_label=False,
@@ -79,11 +80,11 @@ def custom():
                                  container=False,
                                  elem_classes="full-height")
     with gr.Column():
-        generate_button = gr.Button("生成音频", variant="primary", size="lg")
     with gr.Column():
-        output_audio = gr.Audio(label="合成音频")
     seed_button.click(fn=random_seed, outputs=[seed])
     generate_button.click(
         fn=generate_audio,

         t1 = time.time()
         print(_recorded_audio, _prompt_input_textbox, _language_radio, _synthetic_input_textbox, _seed)
         if _synthetic_input_textbox == '':
+            # gr.Warning('合成文本为空，您是否忘记输入合成文本？')
+            gr.Warning('The synthesis text is empty, did you forget to input the synthesis text?')
             return (target_sr, default_data)
         set_all_random_seed(_seed)
         if use_instruct(_synthetic_input_textbox):
             with gr.Column(scale=1, min_width=400):
                 with gr.Group():
                     recorded_audio = gr.Audio(sources=['microphone'],
+                                              label="Record Audio File",
                                               type='filepath')
+                    gr.Text("Please click to record and read the text on the right (Chinese or English) to complete the input",
                             max_lines=1,
                             container=False,
                             interactive=False)
             with gr.Column(scale=10):
+                prompt_input_textbox = gr.Textbox(label="Input Text for Recording")
                 gr.Examples(
+                    label="Example Recording Texts",
                     examples=example_prompt_text,
                     inputs=[prompt_input_textbox])
     with gr.Column():
+        language_radio = gr.Radio(choices=[('Same Language', 'same'), ('Cross Language', 'cross')],
                                   value='same',
+                                  label="Input Synthesis Text")
         synthetic_input_textbox = gr.Textbox(show_label=False)
         gr.Examples(
+            label="Example Texts",
             examples=example_tts_text,
             inputs=[synthetic_input_textbox])
+    with gr.Accordion(label="Random Seed"):
         with gr.Row():
             with gr.Column(scale=1, min_width=180):
+                seed_button = gr.Button(value="\U0001F3B2 Shuffle Randomly",
                                         elem_classes="full-height")
             with gr.Column(scale=10):
                 seed = gr.Number(show_label=False,
                                  container=False,
                                  elem_classes="full-height")
     with gr.Column():
+        generate_button = gr.Button("Generate Audio", variant="primary", size="lg")
     with gr.Column():
+        output_audio = gr.Audio(label="Synthesized Audio")
     seed_button.click(fn=random_seed, outputs=[seed])
     generate_button.click(
         fn=generate_audio,

css/preset.py CHANGED Viewed

@@ -8,7 +8,8 @@ from css.utils import *
 # 预置语音生成
 def preset():
-    sound_choices = ['中文女', '中文男', '英文女', '英文男', '日语男', '粤语女', '韩语女']
     def random_seed():
         return random.randint(1, 100000000)
@@ -17,7 +18,8 @@ def preset():
     def generate_audio(_sound_radio, _synthetic_input_textbox, _seed):
         print(_sound_radio, _synthetic_input_textbox, _seed)
         if _synthetic_input_textbox == '':
-            gr.Warning('合成文本为空，您是否忘记输入合成文本？')
             return (target_sr, default_data)
         set_all_random_seed(_seed)
         if use_instruct(_synthetic_input_textbox):
@@ -31,18 +33,19 @@ def preset():
     with gr.Column():
         sound_radio = gr.Radio(choices=sound_choices,
                                value=sound_choices[0],
-                               label="选择预置音色")
     with gr.Column():
-        synthetic_input_textbox = gr.Textbox(label="输入合成文本")
         gr.Examples(
-            label="示例文本",
             examples=example_tts_text,
             inputs=[synthetic_input_textbox])
-    with gr.Accordion(label="随机种子"):
         with gr.Row():
             with gr.Column(scale=1, min_width=180):
-                seed_button = gr.Button(value="\U0001F3B2 随机换一换",
                                         elem_classes="full-height")
             with gr.Column(scale=10):
                 seed = gr.Number(show_label=False,
@@ -50,10 +53,10 @@ def preset():
                                  container=False,
                                  elem_classes="full-height")
     with gr.Column():
-        generate_button = gr.Button("生成音频", variant="primary", size="lg")
     with gr.Column():
-        output_audio = gr.Audio(label="合成音频")
     seed_button.click(fn=random_seed, outputs=[seed])
     generate_button.click(fn=generate_audio,

 # 预置语音生成
 def preset():
+    #sound_choices = ['中文女', '中文男', '英文女', '英文男', '日语男', '粤语女', '韩语女']
+    sound_choices = ['Chinese Female', 'Chinese Male', 'Japanese Male', 'English Female', 'English Male', 'Cantonese Female', 'Korean Female']
     def random_seed():
         return random.randint(1, 100000000)
     def generate_audio(_sound_radio, _synthetic_input_textbox, _seed):
         print(_sound_radio, _synthetic_input_textbox, _seed)
         if _synthetic_input_textbox == '':
+            # gr.Warning('合成文本为空，您是否忘记输入合成文本？')
+            gr.Warning('The synthesis text is empty, did you forget to input the synthesis text?')
             return (target_sr, default_data)
         set_all_random_seed(_seed)
         if use_instruct(_synthetic_input_textbox):
     with gr.Column():
         sound_radio = gr.Radio(choices=sound_choices,
                                value=sound_choices[0],
+                               label="Select Preset Voice")
+                               #label="选择预置音色")
     with gr.Column():
+        synthetic_input_textbox = gr.Textbox(label="Input Synthesis Text")
         gr.Examples(
+            label="Example Text",
             examples=example_tts_text,
             inputs=[synthetic_input_textbox])
+    with gr.Accordion(label="Random Seed"):
         with gr.Row():
             with gr.Column(scale=1, min_width=180):
+                seed_button = gr.Button(value="\U0001F3B2 Shuffle randomly",
                                         elem_classes="full-height")
             with gr.Column(scale=10):
                 seed = gr.Number(show_label=False,
                                  container=False,
                                  elem_classes="full-height")
     with gr.Column():
+        generate_button = gr.Button("Generate audio", variant="primary", size="lg")
     with gr.Column():
+        output_audio = gr.Audio(label="Synthesize Audio")
     seed_button.click(fn=random_seed, outputs=[seed])
     generate_button.click(fn=generate_audio,