Spaces:

ShoukanLabs
/

Vokan

Running on Zero

App Files Community

ButterCream committed on Mar 28

Commit

9d1687b

•

1 Parent(s): 9ef0c39

attempt fix examples

Browse files

Files changed (1) hide show

app.py +30 -27

app.py CHANGED Viewed

@@ -61,23 +61,24 @@ function refresh() {
     }
 }
 """
-examples = [
-    ["./Examples/David Attenborough.mp3",
-     "An understanding of the natural world is a source of not only great curiosity, but great fulfilment.",
-     1, 0.2, 0.5, 2, 100],
-    ["./Examples/Linus Tech Tips.mp3",
-     "sometimes I get so in the zone while building a computer it's like an out of body experience.",
-     1, 0.3, 0.8, 2, 100],
-    ["./Examples/Melina.mp3",
-     "If you intend to claim the Frenzied Flame, I ask that you cease. It is not to be meddled with. It is chaos, "
-     "devouring life and thought unending. However ruined this world has become, "
-     "however mired in torment and despair, life endures.",
-     1, 0.3, 0.5, 2, 100],
-    ["./Examples/Patrick Bateman.mp3",
-     "My Pain Is Constant And Sharp, And I Do Not Wish For A Better World For Anyone.",
-     1, 0.3, 0.6, 2, 100]
-]
 theme = gr.themes.Soft(
     primary_hue=gr.themes.Color(c100="#ffd7d1", c200="#ff593e", c300="#ff593e", c400="#ff593e", c50="#fff0f0",
@@ -210,16 +211,16 @@ with gr.Blocks(theme=theme, js=js_func) as clone:
     gr.HTML(INTRO)
     with gr.Row():
         with gr.Column(scale=1):
-            inp = gr.Textbox(label="Text", info="What do you want Vokan to say?", interactive=True)
-            voice = gr.Audio(label="Voice", interactive=True, type='filepath', max_length=300,
                              waveform_options={'waveform_progress_color': '#FF593E'})
-            steps = gr.Slider(minimum=3, maximum=60, value=20, step=1, label="Diffusion Steps",
                               info="Higher produces better results typically", interactive=True)
-            embscale = gr.Slider(minimum=1, maximum=10, value=2, step=0.1, label="Embedding Scale",
-                                 info="Defaults to 2 | low scales may produce unexpected results", interactive=True)
-            alpha = gr.Slider(minimum=0, maximum=1, value=0.3, step=0.1, label="Alpha", info="Defaults to 0.3",
                               interactive=True)
-            beta = gr.Slider(minimum=0, maximum=1, value=0.7, step=0.1, label="Beta", info="Defaults to 0.7",
                              interactive=True)
             speed = gr.Slider(minimum=0.5, maximum=1.5, value=1, step=0.1, label="Speed of speech",
                               info="Defaults to 1", interactive=True)
@@ -228,11 +229,13 @@ with gr.Blocks(theme=theme, js=js_func) as clone:
             claudio = gr.Audio(interactive=False, label="Synthesized Audio",
                                waveform_options={'waveform_progress_color': '#FF593E'})
             clbtn.click(generate, inputs=[voice, inp, speed, alpha, beta, embscale, steps], outputs=[claudio],
-                        concurrency_limit=4)
-            gr.Examples(examples=examples,
                         inputs=[voice, inp, speed, alpha, beta, embscale, steps],
-                        outputs=[claudio])
 if __name__ == "__main__":
     # demo.queue(api_open=False, max_size=15).launch(show_api=False)

     }
 }
 """
+def get_example():
+    examples = [
+        ["./Examples/David Attenborough.mp3",
+        "An understanding of the natural world is a source of not only great curiosity, but great fulfilment.",
+        1, 0.2, 0.5, 2, 100],
+        ["./Examples/Linus Tech Tips.mp3",
+        "sometimes I get so in the zone while building a computer it's like an out of body experience.",
+        1, 0.3, 0.8, 2, 100],
+        ["./Examples/Melina.mp3",
+        "If you intend to claim the Frenzied Flame, I ask that you cease. It is not to be meddled with. It is chaos, "
+        "devouring life and thought unending. However ruined this world has become, "
+        "however mired in torment and despair, life endures.",
+        1, 0.3, 0.5, 2, 100],
+        ["./Examples/Patrick Bateman.mp3",
+        "My Pain Is Constant And Sharp, And I Do Not Wish For A Better World For Anyone.",
+        1, 0.3, 0.6, 2, 100]
+    ]
+    return examples
 theme = gr.themes.Soft(
     primary_hue=gr.themes.Color(c100="#ffd7d1", c200="#ff593e", c300="#ff593e", c400="#ff593e", c50="#fff0f0",
     gr.HTML(INTRO)
     with gr.Row():
         with gr.Column(scale=1):
+            inp = gr.Textbox(label="Text", info="What do you want Vokan to say? | Longform generation may produce artifacts in between sentences", interactive=True)
+            voice = gr.Audio(label="Voice", interactive=True, type='filepath', max_length=1000,
                              waveform_options={'waveform_progress_color': '#FF593E'})
+            steps = gr.Slider(minimum=3, maximum=200, value=20, step=1, label="Diffusion Steps | Higher generally = better",
                               info="Higher produces better results typically", interactive=True)
+            embscale = gr.Slider(minimum=1, maximum=5, value=2, step=0.1, label="Embedding Scale",
+                                 info="Defaults to 2 | high scales may produce unexpected results | Higher scales produce more emotion guided reults", interactive=True)
+            alpha = gr.Slider(minimum=0, maximum=1, value=0.3, step=0.1, label="Alpha | Lower = More similar in sound to speaker", info="Defaults to 0.3",
                               interactive=True)
+            beta = gr.Slider(minimum=0, maximum=1, value=0.7, step=0.1, label="Beta | Lower = More similar prosody at cost of stability", info="Defaults to 0.7",
                              interactive=True)
             speed = gr.Slider(minimum=0.5, maximum=1.5, value=1, step=0.1, label="Speed of speech",
                               info="Defaults to 1", interactive=True)
             claudio = gr.Audio(interactive=False, label="Synthesized Audio",
                                waveform_options={'waveform_progress_color': '#FF593E'})
             clbtn.click(generate, inputs=[voice, inp, speed, alpha, beta, embscale, steps], outputs=[claudio],
+                        concurrency_limit=15)
+            gr.Examples(examples=get_example(),
                         inputs=[voice, inp, speed, alpha, beta, embscale, steps],
+                        outputs=[claudio],
+                        fn=generate,
+                        cache_examples=True,)
 if __name__ == "__main__":
     # demo.queue(api_open=False, max_size=15).launch(show_api=False)