Spaces:
Running
on
Zero
Running
on
Zero
Update app.py
Browse files
app.py
CHANGED
@@ -194,10 +194,10 @@ with gr.Blocks(theme=theme, js=js_func) as clone:
|
|
194 |
with gr.Column(scale=1):
|
195 |
inp = gr.Textbox(label="Text", info="What do you want Vokan to say?", interactive=True)
|
196 |
voice = gr.Audio(label="Voice", interactive=True, type='filepath', max_length=300, waveform_options={'waveform_progress_color': '#FF593E'})
|
197 |
-
steps = gr.Slider(minimum=3, maximum=
|
198 |
-
embscale = gr.Slider(minimum=1, maximum=10, value=2, step=0.1, label="Embedding Scale", info="Defaults to 2 |
|
199 |
-
alpha = gr.Slider(minimum=0, maximum=1, value=0.3, step=0.1, label="Alpha", info="Defaults to 0.3", interactive=True)
|
200 |
-
beta = gr.Slider(minimum=0, maximum=1, value=0.7, step=0.1, label="Beta", info="Defaults to 0.7", interactive=True)
|
201 |
speed = gr.Slider(minimum=0.5, maximum=1.5, value=1, step=0.1, label="Speed of speech", info="Defaults to 1", interactive=True)
|
202 |
with gr.Column(scale=1):
|
203 |
clbtn = gr.Button("Synthesize", variant="primary")
|
|
|
194 |
with gr.Column(scale=1):
|
195 |
inp = gr.Textbox(label="Text", info="What do you want Vokan to say?", interactive=True)
|
196 |
voice = gr.Audio(label="Voice", interactive=True, type='filepath', max_length=300, waveform_options={'waveform_progress_color': '#FF593E'})
|
197 |
+
steps = gr.Slider(minimum=3, maximum=100, value=20, step=1, label="Diffusion Steps", info="Higher produces better results typically", interactive=True)
|
198 |
+
embscale = gr.Slider(minimum=1, maximum=10, value=2, step=0.1, label="Embedding Scale", info="Defaults to 2 | High scales may produce unexpected results but may produce more emotional texts", interactive=True)
|
199 |
+
alpha = gr.Slider(minimum=0, maximum=1, value=0.3, step=0.1, label="Alpha", info="Defaults to 0.3 | Resemblance to speakers voice - lower = more similar", interactive=True)
|
200 |
+
beta = gr.Slider(minimum=0, maximum=1, value=0.7, step=0.1, label="Beta", info="Defaults to 0.7 | Resemblance to speakers prosody - lower = more similar - higher = based on sentence", interactive=True)
|
201 |
speed = gr.Slider(minimum=0.5, maximum=1.5, value=1, step=0.1, label="Speed of speech", info="Defaults to 1", interactive=True)
|
202 |
with gr.Column(scale=1):
|
203 |
clbtn = gr.Button("Synthesize", variant="primary")
|