update
inference/tts/gradio/gradio_settings.yaml
CHANGED
@@ -1,12 +1,12 @@
-title: 'NATSpeech/
+title: 'NATSpeech/PortaSpeech'
 description: |
-  Gradio demo for NATSpeech/
+  Gradio demo for NATSpeech/PortaSpeech. To use it, simply add your audio, or click one of the examples to load them. Note: This space is running on CPU, inference times will be higher.
 article: |
-  Link to <a href='https://github.com/NATSpeech/NATSpeech/blob/main/docs/
+  Link to <a href='https://github.com/NATSpeech/NATSpeech/blob/main/docs/portaspeech.md' style='color:blue;' target='_blank\'>Github REPO</a>
 example_inputs:
 - |-
   the invention of movable metal letters in the middle of the fifteenth century may justly be considered as the invention of the art of printing.
 - |-
   produced the block books, which were the immediate predecessors of the true printed book,
-inference_cls: inference.tts.
-exp_name:
+inference_cls: inference.tts.ps_flow.PortaSpeechFlowInfer
+exp_name: ps_normal_exp
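The two keys changed at the bottom of this file, inference_cls and exp_name, are what point the Gradio demo at the PortaSpeech flow inference class and its experiment directory. As a rough sketch of how such a settings file could be resolved (assuming PyYAML and the repo on the Python path; the helper names below are illustrative, not the Space's actual launcher code):

import importlib

import yaml


def load_settings(path='inference/tts/gradio/gradio_settings.yaml'):
    # Parse the YAML settings shown in the diff above.
    with open(path) as f:
        return yaml.safe_load(f)


def resolve_inference_cls(dotted_path):
    # Split 'inference.tts.ps_flow.PortaSpeechFlowInfer' into module and class
    # name, then import the module and fetch the class object from it.
    module_name, cls_name = dotted_path.rsplit('.', 1)
    return getattr(importlib.import_module(module_name), cls_name)


if __name__ == '__main__':
    settings = load_settings()
    infer_cls = resolve_inference_cls(settings['inference_cls'])
    print(infer_cls, settings['exp_name'])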
inference/tts/ps_flow.py
CHANGED
@@ -10,8 +10,9 @@ class PortaSpeechFlowInfer(BaseTTSInfer):
         ph_dict_size = len(self.ph_encoder)
         word_dict_size = len(self.word_encoder)
         model = PortaSpeechFlow(ph_dict_size, word_dict_size, self.hparams)
-        model.eval()
         load_ckpt(model, hparams['work_dir'], 'model')
+        model.post_flow.store_inverse()
+        model.eval()
         return model

     def forward_model(self, inp):
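The reordering matters because store_inverse() is only useful once the trained weights are in place: it caches the inverses used by the post-flow's reverse pass so they are not recomputed on every inference call. A minimal sketch of that pattern with a toy invertible 1x1 convolution (an illustration of the general Glow-style idea, not the repo's post_flow implementation):

import torch
import torch.nn as nn


class ToyInvConv(nn.Module):
    # Illustrative invertible 1x1 convolution over channels of a [B, C, T] tensor.
    def __init__(self, channels):
        super().__init__()
        # Orthogonal initialization keeps the mixing matrix invertible.
        self.weight = nn.Parameter(torch.linalg.qr(torch.randn(channels, channels))[0])
        self.weight_inv = None

    def store_inverse(self):
        # Cache the inverse of the *current* weights so reverse passes skip a
        # matrix inversion per call; must run after the checkpoint is loaded.
        self.weight_inv = torch.inverse(self.weight.detach())

    def forward(self, x, reverse=False):
        if reverse:
            w = self.weight_inv if self.weight_inv is not None else torch.inverse(self.weight)
        else:
            w = self.weight
        return torch.einsum('oc,bct->bot', w, x)


flow = ToyInvConv(4)
# Pretend the checkpoint was loaded here, *then* cache inverses and switch to
# eval mode, mirroring the ordering introduced in the diff above.
flow.store_inverse()
flow.eval()
x = torch.randn(2, 4, 10)
y = flow(x)
x_rec = flow(y, reverse=True)
print(torch.allclose(x, x_rec, atol=1e-5))  # True: reverse undoes forward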
modules/tts/portaspeech/fvae.py
CHANGED
@@ -125,7 +125,7 @@ class FVAE(nn.Module):
             return z_q, loss_kl, z_p, m_q, logs_q
         else:
             latent_shape = [cond_sqz.shape[0], self.latent_size, cond_sqz.shape[2]]
-            z_p =
+            z_p = torch.randn(latent_shape).to(cond.device) * noise_scale
             if self.use_prior_flow:
                 z_p = self.prior_flow(z_p, 1, cond_sqz, reverse=True)
             return z_p
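The restored line draws the latent from a standard Gaussian with the batch size and squeezed time length of the conditioning tensor, moves it to the conditioning device, and scales it by noise_scale before the optional prior flow runs in reverse. A standalone sketch of that inference branch (tensor sizes and the default noise_scale are made up for illustration; the real module calls its own prior_flow):

import torch


def sample_prior_latent(cond_sqz, latent_size, noise_scale=0.8, prior_flow=None):
    # Stand-in for FVAE's inference branch: Gaussian latent matching the
    # condition's batch and squeezed time axes, on the same device, tempered
    # by noise_scale.
    latent_shape = [cond_sqz.shape[0], latent_size, cond_sqz.shape[2]]
    z_p = torch.randn(latent_shape).to(cond_sqz.device) * noise_scale
    if prior_flow is not None:
        # The real module runs its normalizing flow in reverse here.
        z_p = prior_flow(z_p, 1, cond_sqz, reverse=True)
    return z_p


cond_sqz = torch.randn(2, 192, 50)  # hypothetical [B, hidden, T_sqz] condition
z_p = sample_prior_latent(cond_sqz, latent_size=16)
print(z_p.shape)  # torch.Size([2, 16, 50])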
modules/tts/portaspeech/portaspeech_flow.py
CHANGED
@@ -70,6 +70,6 @@ class PortaSpeechFlow(PortaSpeech):
             ret['postflow'] = None
         else:
             nonpadding = torch.ones_like(x_recon[:, :1, :])
-            z_post =
+            z_post = torch.randn(x_recon.shape).to(g.device) * self.hparams['noise_scale']
             x_recon, _ = self.post_flow(z_post, nonpadding, g, reverse=True)
             ret['mel_out'] = x_recon.transpose(1, 2)
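Analogously, the post-flow's inference branch samples noise shaped like the coarse mel prediction, keeps it on the conditioning tensor's device, and tempers it with the configured noise_scale before running the flow in reverse. A self-contained sketch (the dummy post-flow and tensor sizes are placeholders, not the actual module):

import torch


def run_post_flow(x_recon, g, post_flow, noise_scale=0.8):
    # Sample Gaussian noise shaped like the coarse mel, on g's device, scale it
    # by noise_scale, and let the post-flow map it to a refined mel in reverse.
    nonpadding = torch.ones_like(x_recon[:, :1, :])
    z_post = torch.randn(x_recon.shape).to(g.device) * noise_scale
    x_refined, _ = post_flow(z_post, nonpadding, g, reverse=True)
    return x_refined


def dummy_post_flow(z, nonpadding, g, reverse=False):
    # Hypothetical stand-in that just masks and returns its input.
    return z * nonpadding, None


x_recon = torch.randn(2, 80, 120)  # [B, n_mels, T] coarse decoder output
g = torch.randn(2, 192, 120)       # conditioning features
mel = run_post_flow(x_recon, g, dummy_post_flow)
print(mel.shape)  # torch.Size([2, 80, 120])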