Spaces:
Running
on
Zero
Running
on
Zero
Update app.py
Browse files
app.py
CHANGED
@@ -186,7 +186,7 @@ def text_to_phonemes(text):
|
|
186 |
|
187 |
|
188 |
@spaces.GPU
|
189 |
-
def generate(audio_path, ins, speed, alpha, beta, embedding, steps=100, vocos=False):
|
190 |
ref_s = other_tts.compute_style(audio_path)
|
191 |
print(ref_s.size())
|
192 |
s_prev = None
|
@@ -199,7 +199,7 @@ def generate(audio_path, ins, speed, alpha, beta, embedding, steps=100, vocos=Fa
|
|
199 |
synthaud, s_prev = other_tts.long_inference_segment(i, diffusion_steps=steps,
|
200 |
alpha=alpha, beta=beta, is_phonemes=True,
|
201 |
embedding_scale=embedding, prev_s=s_prev, ref_s=ref_s,
|
202 |
-
speed=speed, t=0.8)
|
203 |
|
204 |
n_trim = int(len(synthaud) * 0.009)
|
205 |
synthaud[:n_trim] = 0
|
|
|
186 |
|
187 |
|
188 |
@spaces.GPU
|
189 |
+
def generate(audio_path, ins, speed, alpha, beta, embedding, steps=200, vocos=False):
|
190 |
ref_s = other_tts.compute_style(audio_path)
|
191 |
print(ref_s.size())
|
192 |
s_prev = None
|
|
|
199 |
synthaud, s_prev = other_tts.long_inference_segment(i, diffusion_steps=steps,
|
200 |
alpha=alpha, beta=beta, is_phonemes=True,
|
201 |
embedding_scale=embedding, prev_s=s_prev, ref_s=ref_s,
|
202 |
+
speed=speed, t=0.8, vocos=vocos)
|
203 |
|
204 |
n_trim = int(len(synthaud) * 0.009)
|
205 |
synthaud[:n_trim] = 0
|