Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
add speed
Browse files
app.py
CHANGED
@@ -20,7 +20,7 @@ def get_text(text, hps):
|
|
20 |
|
21 |
|
22 |
def create_tts_fn(model, hps, speaker_ids):
|
23 |
-
def tts_fn(text, speaker):
|
24 |
if len(text) > 150:
|
25 |
return "Error: Text is too long", None
|
26 |
speaker_id = speaker_ids[speaker]
|
@@ -29,9 +29,8 @@ def create_tts_fn(model, hps, speaker_ids):
|
|
29 |
x_tst = stn_tst.unsqueeze(0)
|
30 |
x_tst_lengths = LongTensor([stn_tst.size(0)])
|
31 |
sid = LongTensor([speaker_id])
|
32 |
-
audio =
|
33 |
-
|
34 |
-
0, 0].data.cpu().float().numpy()
|
35 |
return "Success", (hps.data.sampling_rate, audio)
|
36 |
|
37 |
return tts_fn
|
@@ -112,10 +111,12 @@ if __name__ == '__main__':
|
|
112 |
tts_input1 = gr.TextArea(label="Text (150 words limitation)", value="こんにちは。")
|
113 |
tts_input2 = gr.Dropdown(label="Speaker", choices=speakers,
|
114 |
type="index", value=speakers[0])
|
|
|
115 |
tts_submit = gr.Button("Generate", variant="primary")
|
116 |
tts_output1 = gr.Textbox(label="Output Message")
|
117 |
tts_output2 = gr.Audio(label="Output Audio")
|
118 |
-
tts_submit.click(tts_fn, [tts_input1, tts_input2
|
|
|
119 |
with gr.TabItem("Voice Conversion"):
|
120 |
with gr.Tabs():
|
121 |
for i, (models_name, cover_path, speakers, tts_fn, vc_fn) in enumerate(models):
|
|
|
20 |
|
21 |
|
22 |
def create_tts_fn(model, hps, speaker_ids):
|
23 |
+
def tts_fn(text, speaker, speed):
|
24 |
if len(text) > 150:
|
25 |
return "Error: Text is too long", None
|
26 |
speaker_id = speaker_ids[speaker]
|
|
|
29 |
x_tst = stn_tst.unsqueeze(0)
|
30 |
x_tst_lengths = LongTensor([stn_tst.size(0)])
|
31 |
sid = LongTensor([speaker_id])
|
32 |
+
audio = model.infer(x_tst, x_tst_lengths, sid=sid, noise_scale=.667, noise_scale_w=0.8,
|
33 |
+
length_scale=1.0 / speed)[0][0, 0].data.cpu().float().numpy()
|
|
|
34 |
return "Success", (hps.data.sampling_rate, audio)
|
35 |
|
36 |
return tts_fn
|
|
|
111 |
tts_input1 = gr.TextArea(label="Text (150 words limitation)", value="こんにちは。")
|
112 |
tts_input2 = gr.Dropdown(label="Speaker", choices=speakers,
|
113 |
type="index", value=speakers[0])
|
114 |
+
tts_input3 = gr.Slider(label="Speed", value=1, minimum=0.5, maximum=2, step=0.1)
|
115 |
tts_submit = gr.Button("Generate", variant="primary")
|
116 |
tts_output1 = gr.Textbox(label="Output Message")
|
117 |
tts_output2 = gr.Audio(label="Output Audio")
|
118 |
+
tts_submit.click(tts_fn, [tts_input1, tts_input2, tts_input3],
|
119 |
+
[tts_output1, tts_output2])
|
120 |
with gr.TabItem("Voice Conversion"):
|
121 |
with gr.Tabs():
|
122 |
for i, (models_name, cover_path, speakers, tts_fn, vc_fn) in enumerate(models):
|