{
    "base_config": "config/vocoder.json",
    "model_type": "DiffusionVocoder",
    "dataset": [
        "csd",
        "kising",
        "m4singer",
        "nus48e",
        "opencpop",
        "opensinger",
        "opera",
        "pjs",
        "popbutfy",
        "popcs",
        "ljspeech",
        "vctk",
        "libritts"
    ],
    "dataset_path": {
        "csd": "[dataset path]",
        "kising": "[dataset path]",
        "m4singer": "[dataset path]",
        "nus48e": "[dataset path]",
        "opencpop": "[dataset path]",
        "opensinger": "[dataset path]",
        "opera": "[dataset path]",
        "pjs": "[dataset path]",
        "popbutfy": "[dataset path]",
        "popcs": "[dataset path]",
        "ljspeech": "[dataset path]",
        "vctk": "[dataset path]",
        "libritts": "[dataset path]"
    },
    "log_dir": "ckpts/vocoder",
    "preprocess": {
        "extract_mel": true,
        "extract_audio": true,
        "extract_pitch": false,
        "extract_uv": false,
        "pitch_extractor": "parselmouth",
        "use_mel": true,
        "use_frame_pitch": false,
        "use_uv": false,
        "use_audio": true,
        "processed_dir": "data/",
        "n_mel": 100,
        "sample_rate": 24000
    },
    "train": {
        "batch_size": 32,
        "max_epoch": 1000000,
        "save_checkpoint_stride": [20],
        "adamw": {
            "lr": 2.0e-4,
            "adam_b1": 0.8,
            "adam_b2": 0.99
        },
        "exponential_lr": {
            "lr_decay": 0.999
        }
    }
}