Korakoe committed on
Commit
75eb448
1 Parent(s): 6e50b93

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -4
app.py CHANGED
@@ -194,10 +194,10 @@ with gr.Blocks(theme=theme, js=js_func) as clone:
194
  with gr.Column(scale=1):
195
  inp = gr.Textbox(label="Text", info="What do you want Vokan to say?", interactive=True)
196
  voice = gr.Audio(label="Voice", interactive=True, type='filepath', max_length=300, waveform_options={'waveform_progress_color': '#FF593E'})
197
- steps = gr.Slider(minimum=3, maximum=60, value=20, step=1, label="Diffusion Steps", info="Higher produces better results typically", interactive=True)
198
- embscale = gr.Slider(minimum=1, maximum=10, value=2, step=0.1, label="Embedding Scale", info="Defaults to 2 | low scales may produce unexpected results", interactive=True)
199
- alpha = gr.Slider(minimum=0, maximum=1, value=0.3, step=0.1, label="Alpha", info="Defaults to 0.3", interactive=True)
200
- beta = gr.Slider(minimum=0, maximum=1, value=0.7, step=0.1, label="Beta", info="Defaults to 0.7", interactive=True)
201
  speed = gr.Slider(minimum=0.5, maximum=1.5, value=1, step=0.1, label="Speed of speech", info="Defaults to 1", interactive=True)
202
  with gr.Column(scale=1):
203
  clbtn = gr.Button("Synthesize", variant="primary")
 
194
  with gr.Column(scale=1):
195
  inp = gr.Textbox(label="Text", info="What do you want Vokan to say?", interactive=True)
196
  voice = gr.Audio(label="Voice", interactive=True, type='filepath', max_length=300, waveform_options={'waveform_progress_color': '#FF593E'})
197
+ steps = gr.Slider(minimum=3, maximum=100, value=20, step=1, label="Diffusion Steps", info="Higher produces better results typically", interactive=True)
198
+ embscale = gr.Slider(minimum=1, maximum=10, value=2, step=0.1, label="Embedding Scale", info="Defaults to 2 | High scales may produce unexpected results but may produce more emotional texts", interactive=True)
199
+ alpha = gr.Slider(minimum=0, maximum=1, value=0.3, step=0.1, label="Alpha", info="Defaults to 0.3 | Resemblance to speakers voice - lower = more similar", interactive=True)
200
+ beta = gr.Slider(minimum=0, maximum=1, value=0.7, step=0.1, label="Beta", info="Defaults to 0.7 | Resemblance to speakers prosody - lower = more similar - higher = based on sentence", interactive=True)
201
  speed = gr.Slider(minimum=0.5, maximum=1.5, value=1, step=0.1, label="Speed of speech", info="Defaults to 1", interactive=True)
202
  with gr.Column(scale=1):
203
  clbtn = gr.Button("Synthesize", variant="primary")