eureqa / model /trainer_state.json
ThreeBlessings's picture
Added application file
2a4326f
raw
history blame
10.2 kB
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 2.0,
"eval_steps": 2000,
"global_step": 21994,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0,
"eval_HasAns_exact": 0.06747638326585695,
"eval_HasAns_f1": 7.18502154989456,
"eval_HasAns_total": 5928,
"eval_NoAns_exact": 0.0336417157275021,
"eval_NoAns_f1": 0.0336417157275021,
"eval_NoAns_total": 5945,
"eval_best_exact": 50.07159100480081,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 50.075846569172874,
"eval_best_f1_thresh": 0.0,
"eval_exact": 0.050534826918217805,
"eval_f1": 3.6042118881306284,
"eval_runtime": -14.2699,
"eval_samples_per_second": -852.912,
"eval_steps_per_second": -13.385,
"eval_total": 11873,
"step": 0
},
{
"epoch": 0.18186778212239701,
"grad_norm": 40.6475715637207,
"learning_rate": 2.7271983268164044e-05,
"loss": 1.4132,
"step": 2000
},
{
"epoch": 0.18186778212239701,
"eval_HasAns_exact": 67.25708502024291,
"eval_HasAns_f1": 74.98296116605809,
"eval_HasAns_total": 5928,
"eval_NoAns_exact": 70.81581160639193,
"eval_NoAns_f1": 70.81581160639193,
"eval_NoAns_total": 5945,
"eval_best_exact": 69.03899604143855,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 72.89640308198375,
"eval_best_f1_thresh": 0.0,
"eval_exact": 69.03899604143855,
"eval_f1": 72.89640308198369,
"eval_runtime": 136.0827,
"eval_samples_per_second": 89.438,
"eval_steps_per_second": 1.404,
"eval_total": 11873,
"step": 2000
},
{
"epoch": 0.36373556424479403,
"grad_norm": 41.061927795410156,
"learning_rate": 2.4543966536328087e-05,
"loss": 1.2638,
"step": 4000
},
{
"epoch": 0.36373556424479403,
"eval_HasAns_exact": 73.59986504723346,
"eval_HasAns_f1": 81.00757791997825,
"eval_HasAns_total": 5928,
"eval_NoAns_exact": 65.78637510513036,
"eval_NoAns_f1": 65.78637510513036,
"eval_NoAns_total": 5945,
"eval_best_exact": 69.68752632022235,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 73.38607950051664,
"eval_best_f1_thresh": 0.0,
"eval_exact": 69.68752632022235,
"eval_f1": 73.38607950051639,
"eval_runtime": 136.2286,
"eval_samples_per_second": 89.342,
"eval_steps_per_second": 1.402,
"eval_total": 11873,
"step": 4000
},
{
"epoch": 0.5456033463671911,
"grad_norm": 52.56464767456055,
"learning_rate": 2.1815949804492137e-05,
"loss": 1.3977,
"step": 6000
},
{
"epoch": 0.5456033463671911,
"eval_HasAns_exact": 71.94669365721997,
"eval_HasAns_f1": 79.2064004599959,
"eval_HasAns_total": 5928,
"eval_NoAns_exact": 72.17830109335576,
"eval_NoAns_f1": 72.17830109335576,
"eval_NoAns_total": 5945,
"eval_best_exact": 72.07108565653162,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 75.69574176087386,
"eval_best_f1_thresh": 0.0,
"eval_exact": 72.0626631853786,
"eval_f1": 75.68731928972085,
"eval_runtime": 136.1854,
"eval_samples_per_second": 89.371,
"eval_steps_per_second": 1.403,
"eval_total": 11873,
"step": 6000
},
{
"epoch": 0.7274711284895881,
"grad_norm": 49.72623825073242,
"learning_rate": 1.908793307265618e-05,
"loss": 1.3384,
"step": 8000
},
{
"epoch": 0.7274711284895881,
"eval_HasAns_exact": 72.0310391363023,
"eval_HasAns_f1": 78.95689148837117,
"eval_HasAns_total": 5928,
"eval_NoAns_exact": 75.00420521446594,
"eval_NoAns_f1": 75.00420521446594,
"eval_NoAns_total": 5945,
"eval_best_exact": 73.51975069485387,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 76.9777185835984,
"eval_best_f1_thresh": 0.0,
"eval_exact": 73.51975069485387,
"eval_f1": 76.97771858359845,
"eval_runtime": 135.7796,
"eval_samples_per_second": 89.638,
"eval_steps_per_second": 1.407,
"eval_total": 11873,
"step": 8000
},
{
"epoch": 0.9093389106119851,
"grad_norm": 39.458927154541016,
"learning_rate": 1.6359916340820223e-05,
"loss": 1.2258,
"step": 10000
},
{
"epoch": 0.9093389106119851,
"eval_HasAns_exact": 73.54925775978407,
"eval_HasAns_f1": 80.29283351227244,
"eval_HasAns_total": 5928,
"eval_NoAns_exact": 76.23212783851976,
"eval_NoAns_f1": 76.23212783851976,
"eval_NoAns_total": 5945,
"eval_best_exact": 74.88419102164575,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 78.25115110424915,
"eval_best_f1_thresh": 0.0,
"eval_exact": 74.89261349279879,
"eval_f1": 78.25957357540227,
"eval_runtime": 136.1576,
"eval_samples_per_second": 89.389,
"eval_steps_per_second": 1.403,
"eval_total": 11873,
"step": 10000
},
{
"epoch": 1.0912066927343822,
"grad_norm": 41.23106002807617,
"learning_rate": 1.363189960898427e-05,
"loss": 0.7822,
"step": 12000
},
{
"epoch": 1.0912066927343822,
"eval_HasAns_exact": 77.26045883940621,
"eval_HasAns_f1": 84.1124672080756,
"eval_HasAns_total": 5928,
"eval_NoAns_exact": 69.97476871320437,
"eval_NoAns_f1": 69.97476871320437,
"eval_NoAns_total": 5945,
"eval_best_exact": 73.6208203486903,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 77.04191911138483,
"eval_best_f1_thresh": 0.0,
"eval_exact": 73.61239787753728,
"eval_f1": 77.0334966402318,
"eval_runtime": 135.9367,
"eval_samples_per_second": 89.534,
"eval_steps_per_second": 1.405,
"eval_total": 11873,
"step": 12000
},
{
"epoch": 1.273074474856779,
"grad_norm": 21.682905197143555,
"learning_rate": 1.0903882877148312e-05,
"loss": 0.6771,
"step": 14000
},
{
"epoch": 1.273074474856779,
"eval_HasAns_exact": 73.78542510121457,
"eval_HasAns_f1": 80.35769680092089,
"eval_HasAns_total": 5928,
"eval_NoAns_exact": 80.7569386038688,
"eval_NoAns_f1": 80.7569386038688,
"eval_NoAns_total": 5945,
"eval_best_exact": 77.27617282910806,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 80.55760352361308,
"eval_best_f1_thresh": 0.0,
"eval_exact": 77.27617282910806,
"eval_f1": 80.55760352361317,
"eval_runtime": 136.5688,
"eval_samples_per_second": 89.12,
"eval_steps_per_second": 1.399,
"eval_total": 11873,
"step": 14000
},
{
"epoch": 1.4549422569791761,
"grad_norm": 56.2855339050293,
"learning_rate": 8.175866145312359e-06,
"loss": 0.6521,
"step": 16000
},
{
"epoch": 1.4549422569791761,
"eval_HasAns_exact": 71.82860998650472,
"eval_HasAns_f1": 77.91336965584932,
"eval_HasAns_total": 5928,
"eval_NoAns_exact": 85.18082422203533,
"eval_NoAns_f1": 85.18082422203533,
"eval_NoAns_total": 5945,
"eval_best_exact": 78.52269855975743,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 81.56072225384261,
"eval_best_f1_thresh": 0.0,
"eval_exact": 78.51427608860439,
"eval_f1": 81.55229978268969,
"eval_runtime": 136.3366,
"eval_samples_per_second": 89.272,
"eval_steps_per_second": 1.401,
"eval_total": 11873,
"step": 16000
},
{
"epoch": 1.6368100391015732,
"grad_norm": 24.467727661132812,
"learning_rate": 5.447849413476403e-06,
"loss": 0.6455,
"step": 18000
},
{
"epoch": 1.6368100391015732,
"eval_HasAns_exact": 75.57354925775978,
"eval_HasAns_f1": 82.12994203860852,
"eval_HasAns_total": 5928,
"eval_NoAns_exact": 79.0412111017662,
"eval_NoAns_f1": 79.0412111017662,
"eval_NoAns_total": 5945,
"eval_best_exact": 77.31828518487325,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 80.59178778782702,
"eval_best_f1_thresh": 0.0,
"eval_exact": 77.30986271372021,
"eval_f1": 80.58336531667406,
"eval_runtime": 136.1893,
"eval_samples_per_second": 89.368,
"eval_steps_per_second": 1.402,
"eval_total": 11873,
"step": 18000
},
{
"epoch": 1.8186778212239703,
"grad_norm": 36.233985900878906,
"learning_rate": 2.7198326816404476e-06,
"loss": 0.6175,
"step": 20000
},
{
"epoch": 1.8186778212239703,
"eval_HasAns_exact": 74.19028340080972,
"eval_HasAns_f1": 80.57880057678263,
"eval_HasAns_total": 5928,
"eval_NoAns_exact": 83.46509671993272,
"eval_NoAns_f1": 83.46509671993272,
"eval_NoAns_total": 5945,
"eval_best_exact": 78.83432999241978,
"eval_best_exact_thresh": 0.0,
"eval_best_f1": 82.02401497676792,
"eval_best_f1_thresh": 0.0,
"eval_exact": 78.83432999241978,
"eval_f1": 82.02401497676809,
"eval_runtime": 136.3043,
"eval_samples_per_second": 89.293,
"eval_steps_per_second": 1.401,
"eval_total": 11873,
"step": 20000
},
{
"epoch": 2.0,
"step": 21994,
"total_flos": 4371201741330432.0,
"train_loss": 0.9652459149015072,
"train_runtime": 5408.776,
"train_samples_per_second": 48.794,
"train_steps_per_second": 4.066
}
],
"logging_steps": 2000,
"max_steps": 21994,
"num_input_tokens_seen": 0,
"num_train_epochs": 2,
"save_steps": 2000,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 4371201741330432.0,
"train_batch_size": 12,
"trial_name": null,
"trial_params": null
}