# fastspeech2-mf1 / config.yaml
# Hosting-page metadata captured with the file (not configuration):
# arampacha · commit 2c10c45 ("model") · 608 Bytes
# Audio feature-extraction, normalization and vocoder settings.
# NOTE(review): nesting is restored from the key layout (alphabetically ordered
# children under `features`; vocoder/hub sub-keys grouped under their parents).
# Confirm against the schema of the loader that consumes this file.
audio_root: ./

# Spectrogram parameters plus the bounds recorded for energy and pitch.
features:
  energy_max: 5.850490093231201
  energy_min: 0.0
  eps: 1.0e-05
  f_max: 8000
  f_min: 0
  # Equals hop_length / sample_rate (256 / 22050).
  hop_len_t: 0.011609977324263039
  hop_length: 256
  n_fft: 1024
  n_mels: 80
  # Equals n_fft / 2 + 1.
  n_stft: 513
  pitch_max: 6.524898211542482
  pitch_min: 1.0e-08
  # Same value as the top-level sample_rate; the two keys live in different
  # mappings, so this is not a duplicate key.
  sample_rate: 22050
  type: spectrogram+melscale+log
  # Equals win_length / sample_rate (1024 / 22050).
  win_len_t: 0.046439909297052155
  win_length: 1024
  window_fn: hann

# Presumably the statistics file read by the `global_cmvn` transform listed
# under `transforms` -- TODO confirm; path looks relative to audio_root.
global_cmvn:
  stats_npz_path: gcmvn_stats.npz

sample_rate: 22050

transforms:
  # The key must stay quoted: a bare * would be parsed as a YAML alias.
  # NOTE(review): '*' presumably means "every data split" -- confirm.
  '*':
    - global_cmvn

vocab_filename: vocab.txt

# Vocoder selection and the files it needs; `type` here is vocoder.type and is
# distinct from features.type.
vocoder:
  type: hifigan
  config: hifigan.json
  checkpoint: hifigan.bin

hub:
  phonemizer: g2p