AdalAbilbekov committed on
Commit
d2969a7
1 Parent(s): 4b2875e

final commit

Browse files
g_01720000 → CNN_SGD_001_1885.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fa0a76a49573909b968708717138849d68d9627cdf03307d00c7bd49278dc573
3
- size 55824433
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ac783b9b049185deaa258d2c2c8ba1b1311451ea9fa74e83919130b529f2b2a
3
+ size 1748943
__pycache__/data_collate.cpython-39.pyc ADDED
Binary file (5.77 kB). View file
 
__pycache__/data_loader.cpython-39.pyc ADDED
Binary file (11.4 kB). View file
 
__pycache__/env.cpython-39.pyc ADDED
Binary file (840 Bytes). View file
 
__pycache__/models.cpython-39.pyc ADDED
Binary file (8.75 kB). View file
 
__pycache__/utils_data.cpython-39.pyc ADDED
Binary file (11.9 kB). View file
 
__pycache__/xutils.cpython-39.pyc ADDED
Binary file (2.05 kB). View file
 
app.py CHANGED
@@ -39,7 +39,9 @@ model = SpecClassifier(
39
  model_type=getattr(hps.model, "classifier_type", "CNN-with-time")
40
  )
41
 
42
- ckpt = './cnnwt_SGD_1959.pt'
 
 
43
  ckpt_tts = './grad_uncond_cnn_001.pt'
44
 
45
  utils.load_checkpoint_no_logger(ckpt_tts, gradtts_uncond_model, None)
@@ -70,7 +72,7 @@ def generate_audio(text, quantity, speaker, emotion_1, emotion_2):
70
 
71
  y_enc, y_dec, attn = gradtts_uncond_model.classifier_guidance_decode_two_mixture(
72
  x, x_lengths,
73
- n_timesteps=10,
74
  temperature=2.0,
75
  stoc=args.stoc,
76
  spk=sid,
@@ -83,9 +85,8 @@ def generate_audio(text, quantity, speaker, emotion_1, emotion_2):
83
  classifier_type=model.model_type
84
  )
85
  y_dec = y_dec.detach()
86
- # y_dec = torch.nan_to_num(y_dec)
87
- res = y_dec.squeeze().cpu().numpy()
88
- x = torch.from_numpy(res).cuda().unsqueeze(0)
89
  y_g_hat = vocoder(x)
90
  audio = y_g_hat.squeeze()
91
  audio = audio * 32768.0
@@ -102,8 +103,8 @@ spekears = ['Madi', 'Marzhan', 'Akzhol']
102
  demo = gr.Interface(
103
  generate_audio,
104
  [
105
- gr.Textbox(value='Сәлем', label="Text you want to synthesize"),
106
- gr.Slider(0, 100, value=0, step=10, label="Count", info="Choose between 0 and 100"),
107
  gr.Dropdown(spekears, value=spekears[1], label="Narrator", info="Select a narrator."
108
  ),
109
  gr.Dropdown(emotions, label="Emotion 1", info="Select first emotion"),
 
39
  model_type=getattr(hps.model, "classifier_type", "CNN-with-time")
40
  )
41
 
42
+ # ckpt = './cnnwt_SGD_1959.pt'
43
+ # ckpt_tts = './grad_uncond_cnn_001.pt'
44
+ ckpt = './CNN_SGD_001_1885.pt'
45
  ckpt_tts = './grad_uncond_cnn_001.pt'
46
 
47
  utils.load_checkpoint_no_logger(ckpt_tts, gradtts_uncond_model, None)
 
72
 
73
  y_enc, y_dec, attn = gradtts_uncond_model.classifier_guidance_decode_two_mixture(
74
  x, x_lengths,
75
+ n_timesteps=100,
76
  temperature=2.0,
77
  stoc=args.stoc,
78
  spk=sid,
 
85
  classifier_type=model.model_type
86
  )
87
  y_dec = y_dec.detach()
88
+ res = y_dec.squeeze().to(device).numpy()
89
+ x = torch.from_numpy(res).unsqueeze(0)
 
90
  y_g_hat = vocoder(x)
91
  audio = y_g_hat.squeeze()
92
  audio = audio * 32768.0
 
103
  demo = gr.Interface(
104
  generate_audio,
105
  [
106
+ gr.Textbox(value='Батпақ соры шабындыққа және жыл бойғы жайылымға пайдаланылады.', label="Text you want to synthesize"),
107
+ gr.Slider(0, 100, value=50, step=10, label="Count", info="Choose between 0 and 100"),
108
  gr.Dropdown(spekears, value=spekears[1], label="Narrator", info="Select a narrator."
109
  ),
110
  gr.Dropdown(emotions, label="Emotion 1", info="Select first emotion"),
model/__pycache__/__init__.cpython-39.pyc CHANGED
Binary files a/model/__pycache__/__init__.cpython-39.pyc and b/model/__pycache__/__init__.cpython-39.pyc differ
 
model/__pycache__/base.cpython-39.pyc ADDED
Binary file (1.34 kB). View file
 
model/__pycache__/classifier.cpython-39.pyc ADDED
Binary file (20.1 kB). View file
 
model/__pycache__/diffusion.cpython-39.pyc ADDED
Binary file (15.6 kB). View file
 
model/__pycache__/text_encoder.cpython-39.pyc ADDED
Binary file (10.9 kB). View file
 
model/__pycache__/tts.cpython-39.pyc CHANGED
Binary files a/model/__pycache__/tts.cpython-39.pyc and b/model/__pycache__/tts.cpython-39.pyc differ
 
model/__pycache__/utils.cpython-39.pyc ADDED
Binary file (1.71 kB). View file
 
text/__pycache__/__init__.cpython-39.pyc ADDED
Binary file (3.74 kB). View file
 
text/__pycache__/cleaners.cpython-39.pyc ADDED
Binary file (2.11 kB). View file
 
text/__pycache__/cmudict.cpython-39.pyc ADDED
Binary file (2.24 kB). View file
 
text/__pycache__/symbols.cpython-39.pyc ADDED
Binary file (830 Bytes). View file