|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 79.992, |
|
"global_step": 4960, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 4.83, |
|
"learning_rate": 0.00017999999999999998, |
|
"loss": 5.8789, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 4.83, |
|
"eval_loss": 3.1512646675109863, |
|
"eval_runtime": 167.7164, |
|
"eval_samples_per_second": 9.82, |
|
"eval_wer": 1.0, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 9.67, |
|
"learning_rate": 0.00029327354260089687, |
|
"loss": 1.8544, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 9.67, |
|
"eval_loss": 0.4943191707134247, |
|
"eval_runtime": 170.9272, |
|
"eval_samples_per_second": 9.636, |
|
"eval_wer": 0.5103553299492386, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 14.51, |
|
"learning_rate": 0.0002730941704035874, |
|
"loss": 0.2628, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 14.51, |
|
"eval_loss": 0.46906277537345886, |
|
"eval_runtime": 172.4339, |
|
"eval_samples_per_second": 9.551, |
|
"eval_wer": 0.43147208121827413, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 19.35, |
|
"learning_rate": 0.000252914798206278, |
|
"loss": 0.124, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 19.35, |
|
"eval_loss": 0.4130130708217621, |
|
"eval_runtime": 172.8773, |
|
"eval_samples_per_second": 9.527, |
|
"eval_wer": 0.36, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 24.19, |
|
"learning_rate": 0.0002327354260089686, |
|
"loss": 0.0857, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 24.19, |
|
"eval_loss": 0.43019285798072815, |
|
"eval_runtime": 176.7931, |
|
"eval_samples_per_second": 9.316, |
|
"eval_wer": 0.3513705583756345, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 29.03, |
|
"learning_rate": 0.00021255605381165918, |
|
"loss": 0.0653, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 29.03, |
|
"eval_loss": 0.4362075626850128, |
|
"eval_runtime": 190.6223, |
|
"eval_samples_per_second": 8.64, |
|
"eval_wer": 0.3595939086294416, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 33.86, |
|
"learning_rate": 0.00019237668161434975, |
|
"loss": 0.0632, |
|
"step": 2100 |
|
}, |
|
{ |
|
"epoch": 33.86, |
|
"eval_loss": 0.4273272156715393, |
|
"eval_runtime": 177.8151, |
|
"eval_samples_per_second": 9.262, |
|
"eval_wer": 0.33390862944162436, |
|
"step": 2100 |
|
}, |
|
{ |
|
"epoch": 38.7, |
|
"learning_rate": 0.00017219730941704035, |
|
"loss": 0.0499, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 38.7, |
|
"eval_loss": 0.4455905258655548, |
|
"eval_runtime": 177.4805, |
|
"eval_samples_per_second": 9.28, |
|
"eval_wer": 0.32558375634517767, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 43.54, |
|
"learning_rate": 0.00015201793721973095, |
|
"loss": 0.0412, |
|
"step": 2700 |
|
}, |
|
{ |
|
"epoch": 43.54, |
|
"eval_loss": 0.4279979467391968, |
|
"eval_runtime": 179.3129, |
|
"eval_samples_per_second": 9.185, |
|
"eval_wer": 0.3316751269035533, |
|
"step": 2700 |
|
}, |
|
{ |
|
"epoch": 48.38, |
|
"learning_rate": 0.00013183856502242152, |
|
"loss": 0.0428, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 48.38, |
|
"eval_loss": 0.42648839950561523, |
|
"eval_runtime": 179.9053, |
|
"eval_samples_per_second": 9.155, |
|
"eval_wer": 0.3197969543147208, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 53.22, |
|
"learning_rate": 0.0001116591928251121, |
|
"loss": 0.0345, |
|
"step": 3300 |
|
}, |
|
{ |
|
"epoch": 53.22, |
|
"eval_loss": 0.46762773394584656, |
|
"eval_runtime": 179.9553, |
|
"eval_samples_per_second": 9.152, |
|
"eval_wer": 0.31228426395939085, |
|
"step": 3300 |
|
}, |
|
{ |
|
"epoch": 58.06, |
|
"learning_rate": 9.147982062780269e-05, |
|
"loss": 0.0335, |
|
"step": 3600 |
|
}, |
|
{ |
|
"epoch": 58.06, |
|
"eval_loss": 0.4403984248638153, |
|
"eval_runtime": 181.1578, |
|
"eval_samples_per_second": 9.092, |
|
"eval_wer": 0.3096446700507614, |
|
"step": 3600 |
|
}, |
|
{ |
|
"epoch": 62.9, |
|
"learning_rate": 7.130044843049327e-05, |
|
"loss": 0.0308, |
|
"step": 3900 |
|
}, |
|
{ |
|
"epoch": 62.9, |
|
"eval_loss": 0.4584444463253021, |
|
"eval_runtime": 182.2608, |
|
"eval_samples_per_second": 9.036, |
|
"eval_wer": 0.3082233502538071, |
|
"step": 3900 |
|
}, |
|
{ |
|
"epoch": 67.74, |
|
"learning_rate": 5.112107623318385e-05, |
|
"loss": 0.0253, |
|
"step": 4200 |
|
}, |
|
{ |
|
"epoch": 67.74, |
|
"eval_loss": 0.4203069806098938, |
|
"eval_runtime": 182.5783, |
|
"eval_samples_per_second": 9.021, |
|
"eval_wer": 0.3001015228426396, |
|
"step": 4200 |
|
}, |
|
{ |
|
"epoch": 72.58, |
|
"learning_rate": 3.094170403587444e-05, |
|
"loss": 0.0243, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 72.58, |
|
"eval_loss": 0.43954339623451233, |
|
"eval_runtime": 183.1424, |
|
"eval_samples_per_second": 8.993, |
|
"eval_wer": 0.29736040609137054, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 77.42, |
|
"learning_rate": 1.0762331838565022e-05, |
|
"loss": 0.0229, |
|
"step": 4800 |
|
}, |
|
{ |
|
"epoch": 77.42, |
|
"eval_loss": 0.44123971462249756, |
|
"eval_runtime": 183.8976, |
|
"eval_samples_per_second": 8.956, |
|
"eval_wer": 0.29218274111675124, |
|
"step": 4800 |
|
}, |
|
{ |
|
"epoch": 79.99, |
|
"step": 4960, |
|
"total_flos": 3.4759190857567523e+19, |
|
"train_runtime": 32940.4351, |
|
"train_samples_per_second": 0.151 |
|
} |
|
], |
|
"max_steps": 4960, |
|
"num_train_epochs": 80, |
|
"total_flos": 3.4759190857567523e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|