waveformer / default_config.json
bandhav's picture
Base code
e6a6383
{
"model": "src.training.dcc_tf",
"model_params":
{
"label_len": 41,
"L": 32,
"enc_dim": 512,
"num_enc_layers": 10,
"dec_dim": 256,
"num_dec_layers": 1,
"dec_buf_len": 13,
"dec_chunk_size": 13,
"out_buf_len": 4,
"use_pos_enc": true
},
"train_data":
{
"input_dir": "data/FSDSoundScapes",
"dset": "train",
"sr": 44100,
"resample_rate": null,
"max_num_targets":3
},
"val_data":
{
"input_dir": "data/FSDSoundScapes",
"dset": "val",
"sr": 44100,
"resample_rate": null,
"max_num_targets":3
},
"test_data":
{
"input_dir": "data/FSDSoundScapes",
"dset": "test",
"sr": 44100,
"resample_rate": null,
"max_num_targets":3
},
"optim":
{
"lr": 5e-4,
"weight_decay": 0.0
},
"lr_sched":
{
"mode": "max",
"factor": 0.1,
"patience": 5,
"min_lr": 5e-6,
"threshold": 0.1,
"threshold_mode": "abs"
},
"base_metric": "scale_invariant_signal_noise_ratio",
"fix_lr_epochs": 50,
"epochs": 150,
"batch_size": 16,
"eval_batch_size": 64,
"n_workers": 16
}