# Repository page header captured along with this file (not part of the config):
#   t1 / config.yml
#   duongmle's picture
#   Upload config.yml
#   3559d52
# Top-level run settings. Keys are grouped by name only; their exact meaning
# is defined by the training script that consumes this file.

# Which model this run targets and the base config it points at.
model_type: tacotron2
config: ./ttsexamples/tacotron2/conf/tacotron2.v1.yaml

# Evaluation-side data directory and data-loading switches.
# (The matching train_dir key appears further down the file.)
dev_dir: /content/dump_ljspeech/valid
format: npy
allow_cache: true
is_shuffle: true
batch_size: 1

# Size and length limits.
# NOTE(review): units are not stated in this file -- confirm with the trainer.
hop_size: 256
max_char_length: 128
max_mel_length: 257
mel_length_threshold: 32

# Step-based cadence for evaluation and logging.
eval_interval_steps: 50
log_interval_steps: 20
num_save_intermediate_results: 1

# Remaining numeric and boolean switches.
gradient_accumulation_steps: 1
mixed_precision: false
# Counterpart of start_ratio_value, which is set further down the file.
end_ratio_value: 0.0
# Optimizer settings.
# Written as a block mapping so every nested key is indented beneath its
# parent (a wrapped flow mapping must also be indented past the parent key,
# otherwise strict YAML parsers reject the file) and each key gets its own
# line for clean diffs.
optimizer_params:
  # Learning-rate values and the step count listed alongside them.
  initial_learning_rate: 0.001
  end_learning_rate: 1.0e-05
  decay_steps: 150000
  warmup_proportion: 0.02
  weight_decay: 0.001
# Output location and how often (in steps) results are saved.
outdir: ./ttsexamples/tacotron2/exp/train.tacotron2.v1/
save_interval_steps: 20

# Both of these are explicitly empty strings (not null).
pretrained: ''
resume: ''

remove_short_samples: true

# Ratio schedule settings (end_ratio_value is set near the top of the file).
start_ratio_value: 0.5
schedule_decay_steps: 50000
# NOTE(review): 200001 is larger than train_max_steps (200000), so presumably
# this schedule never starts during the run -- confirm against the trainer.
start_schedule_teacher_forcing: 200001
# Model hyperparameters for the tacotron2 model selected by model_type.
# Written as a block mapping so every nested key is indented beneath its
# parent (a wrapped flow mapping must also be indented past the parent key,
# otherwise strict YAML parsers reject the file). Keys are grouped by their
# name prefix; values are unchanged.
tacotron2_params:
  # General settings.
  dataset: ljspeech
  n_speakers: 1
  n_mels: 80
  reduction_factor: 1
  initializer_range: 0.02

  # embedding_* keys.
  embedding_hidden_size: 512
  embedding_dropout_prob: 0.1

  # Encoder keys.
  n_conv_encoder: 5
  encoder_conv_filters: 512
  encoder_conv_kernel_sizes: 5
  encoder_conv_activation: relu
  encoder_conv_dropout_rate: 0.5
  encoder_lstm_units: 256

  # attention_* keys.
  attention_type: lsa
  attention_dim: 128
  attention_filters: 32
  attention_kernel: 31

  # Prenet keys.
  n_prenet_layers: 2
  prenet_units: 256
  prenet_activation: relu
  prenet_dropout_rate: 0.5

  # Decoder keys.
  n_lstm_decoder: 1
  decoder_lstm_units: 1024

  # Postnet keys.
  n_conv_postnet: 5
  postnet_conv_filters: 512
  postnet_conv_kernel_sizes: 5
  postnet_dropout_rate: 0.1
# Training-side data directory and the step limit for the run.
# (The matching dev_dir key appears near the top of the file.)
train_dir: /content/dump_ljspeech/train
train_max_steps: 200000

# use_* boolean switches.
use_fal: false
use_fixed_shapes: true
use_norm: true

# Explicit null, i.e. no value is supplied for this key.
var_train_expr: null

verbose: 1
# Quoted so the value stays the string '0.0' rather than becoming a float.
version: '0.0'