trocr-large-handwritten-fr / trainer_state.json
agomberto's picture
:tada: update model 20230703
e75e7f4
raw
history blame
7.2 kB
{
"best_metric": 0.5421165227890015,
"best_model_checkpoint": "./20230701_models/checkpoint-1099",
"epoch": 19.94540491355778,
"global_step": 5480,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_cer": 0.10819683151455398,
"eval_loss": 0.6883996725082397,
"eval_runtime": 259.3566,
"eval_samples_per_second": 8.143,
"eval_steps_per_second": 0.509,
"eval_wer": 0.26681723843242583,
"step": 274
},
{
"epoch": 1.82,
"learning_rate": 3.635766423357665e-05,
"loss": 0.9397,
"step": 500
},
{
"epoch": 2.0,
"eval_cer": 0.08392901158491496,
"eval_loss": 0.5709623694419861,
"eval_runtime": 251.7707,
"eval_samples_per_second": 8.389,
"eval_steps_per_second": 0.524,
"eval_wer": 0.2248809669149066,
"step": 549
},
{
"epoch": 3.0,
"eval_cer": 0.07773321083648912,
"eval_loss": 0.5516401529312134,
"eval_runtime": 253.1328,
"eval_samples_per_second": 8.343,
"eval_steps_per_second": 0.521,
"eval_wer": 0.20919301672567453,
"step": 824
},
{
"epoch": 3.64,
"learning_rate": 3.270802919708029e-05,
"loss": 0.2569,
"step": 1000
},
{
"epoch": 4.0,
"eval_cer": 0.07259058417549914,
"eval_loss": 0.5421165227890015,
"eval_runtime": 253.562,
"eval_samples_per_second": 8.329,
"eval_steps_per_second": 0.521,
"eval_wer": 0.20198998901233062,
"step": 1099
},
{
"epoch": 5.0,
"eval_cer": 0.07377820601877787,
"eval_loss": 0.5494938492774963,
"eval_runtime": 254.0497,
"eval_samples_per_second": 8.313,
"eval_steps_per_second": 0.52,
"eval_wer": 0.2014406055426688,
"step": 1373
},
{
"epoch": 5.46,
"learning_rate": 2.9058394160583945e-05,
"loss": 0.109,
"step": 1500
},
{
"epoch": 6.0,
"eval_cer": 0.07154861406771686,
"eval_loss": 0.5665440559387207,
"eval_runtime": 253.9146,
"eval_samples_per_second": 8.318,
"eval_steps_per_second": 0.52,
"eval_wer": 0.1971676230008546,
"step": 1648
},
{
"epoch": 7.0,
"eval_cer": 0.07226566876554552,
"eval_loss": 0.5868140459060669,
"eval_runtime": 253.2966,
"eval_samples_per_second": 8.338,
"eval_steps_per_second": 0.521,
"eval_wer": 0.1968624099621536,
"step": 1923
},
{
"epoch": 7.28,
"learning_rate": 2.5408759124087593e-05,
"loss": 0.0481,
"step": 2000
},
{
"epoch": 8.0,
"eval_cer": 0.07029376834651668,
"eval_loss": 0.5920885801315308,
"eval_runtime": 252.718,
"eval_samples_per_second": 8.357,
"eval_steps_per_second": 0.522,
"eval_wer": 0.19570260041508974,
"step": 2198
},
{
"epoch": 9.0,
"eval_cer": 0.07013691263136666,
"eval_loss": 0.5932603478431702,
"eval_runtime": 254.5349,
"eval_samples_per_second": 8.297,
"eval_steps_per_second": 0.519,
"eval_wer": 0.19374923696740326,
"step": 2472
},
{
"epoch": 9.1,
"learning_rate": 2.1759124087591242e-05,
"loss": 0.022,
"step": 2500
},
{
"epoch": 10.0,
"eval_cer": 0.06856835547986645,
"eval_loss": 0.6067739725112915,
"eval_runtime": 253.5231,
"eval_samples_per_second": 8.331,
"eval_steps_per_second": 0.521,
"eval_wer": 0.1925894274203394,
"step": 2747
},
{
"epoch": 10.92,
"learning_rate": 1.8116788321167883e-05,
"loss": 0.0108,
"step": 3000
},
{
"epoch": 11.0,
"eval_cer": 0.06744795751450916,
"eval_loss": 0.6042998433113098,
"eval_runtime": 253.2695,
"eval_samples_per_second": 8.339,
"eval_steps_per_second": 0.521,
"eval_wer": 0.1902087657184715,
"step": 3022
},
{
"epoch": 12.0,
"eval_cer": 0.06674210679633406,
"eval_loss": 0.6130247116088867,
"eval_runtime": 253.5585,
"eval_samples_per_second": 8.329,
"eval_steps_per_second": 0.521,
"eval_wer": 0.18856061530948603,
"step": 3297
},
{
"epoch": 12.74,
"learning_rate": 1.4467153284671533e-05,
"loss": 0.0052,
"step": 3500
},
{
"epoch": 13.0,
"eval_cer": 0.0659802361798911,
"eval_loss": 0.6161753535270691,
"eval_runtime": 254.095,
"eval_samples_per_second": 8.312,
"eval_steps_per_second": 0.519,
"eval_wer": 0.1861799536076181,
"step": 3571
},
{
"epoch": 14.0,
"eval_cer": 0.06466937056042306,
"eval_loss": 0.6252880692481995,
"eval_runtime": 254.0952,
"eval_samples_per_second": 8.312,
"eval_steps_per_second": 0.519,
"eval_wer": 0.18471493102185324,
"step": 3846
},
{
"epoch": 14.56,
"learning_rate": 1.0817518248175182e-05,
"loss": 0.0028,
"step": 4000
},
{
"epoch": 15.0,
"eval_cer": 0.06428843525220158,
"eval_loss": 0.6240524649620056,
"eval_runtime": 253.6298,
"eval_samples_per_second": 8.327,
"eval_steps_per_second": 0.52,
"eval_wer": 0.18270052496642655,
"step": 4121
},
{
"epoch": 16.0,
"eval_cer": 0.06460214668250162,
"eval_loss": 0.6327393054962158,
"eval_runtime": 254.0581,
"eval_samples_per_second": 8.313,
"eval_steps_per_second": 0.52,
"eval_wer": 0.18428763276767182,
"step": 4396
},
{
"epoch": 16.38,
"learning_rate": 7.167883211678832e-06,
"loss": 0.0016,
"step": 4500
},
{
"epoch": 17.0,
"eval_cer": 0.0632464651444193,
"eval_loss": 0.6320570707321167,
"eval_runtime": 253.728,
"eval_samples_per_second": 8.324,
"eval_steps_per_second": 0.52,
"eval_wer": 0.18190697106580392,
"step": 4670
},
{
"epoch": 18.0,
"eval_cer": 0.06377305218813722,
"eval_loss": 0.6347479224205017,
"eval_runtime": 254.3801,
"eval_samples_per_second": 8.303,
"eval_steps_per_second": 0.519,
"eval_wer": 0.18239531192772554,
"step": 4945
},
{
"epoch": 18.2,
"learning_rate": 3.5182481751824822e-06,
"loss": 0.0011,
"step": 5000
},
{
"epoch": 19.0,
"eval_cer": 0.06367221637125507,
"eval_loss": 0.6383982300758362,
"eval_runtime": 254.2837,
"eval_samples_per_second": 8.306,
"eval_steps_per_second": 0.519,
"eval_wer": 0.1815407154193627,
"step": 5220
},
{
"epoch": 19.95,
"eval_cer": 0.06354897259506577,
"eval_loss": 0.6386234164237976,
"eval_runtime": 253.9317,
"eval_samples_per_second": 8.317,
"eval_steps_per_second": 0.52,
"eval_wer": 0.18233426931998534,
"step": 5480
}
],
"max_steps": 5480,
"num_train_epochs": 20,
"total_flos": 9.42327114459343e+20,
"trial_name": null,
"trial_params": null
}