nerugm-base-0 / trainer_state.json
apwic's picture
End of training
5788f3c verified
raw
history blame
145 kB
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 100.0,
"eval_steps": 500,
"global_step": 10600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 3.0579540729522705,
"learning_rate": 4.9500000000000004e-05,
"loss": 0.3605,
"step": 106
},
{
"epoch": 1.0,
"eval_LOCATION_f1": 0.8333333333333333,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.696969696969697,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6216216216216216,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.8670886075949367,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8353658536585366,
"eval_PERSON_recall": 0.9013157894736842,
"eval_QUANTITY_f1": 0.71875,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6764705882352942,
"eval_QUANTITY_recall": 0.7666666666666667,
"eval_TIME_f1": 0.8852459016393444,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.84375,
"eval_TIME_recall": 0.9310344827586207,
"eval_loss": 0.14203932881355286,
"eval_overall_accuracy": 0.9562099871959027,
"eval_overall_f1": 0.8172942817294282,
"eval_overall_precision": 0.7730870712401056,
"eval_overall_recall": 0.8668639053254438,
"eval_runtime": 0.3189,
"eval_samples_per_second": 586.358,
"eval_steps_per_second": 9.407,
"step": 106
},
{
"epoch": 2.0,
"grad_norm": 2.4212687015533447,
"learning_rate": 4.9e-05,
"loss": 0.1203,
"step": 212
},
{
"epoch": 2.0,
"eval_LOCATION_f1": 0.8266666666666668,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.6917293233082706,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6133333333333333,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.8867924528301887,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.6865671641791045,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6216216216216216,
"eval_QUANTITY_recall": 0.7666666666666667,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6857142857142857,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.14541447162628174,
"eval_overall_accuracy": 0.9556978233034571,
"eval_overall_f1": 0.8087431693989071,
"eval_overall_precision": 0.751269035532995,
"eval_overall_recall": 0.8757396449704142,
"eval_runtime": 0.3201,
"eval_samples_per_second": 584.228,
"eval_steps_per_second": 9.373,
"step": 212
},
{
"epoch": 3.0,
"grad_norm": 5.2256245613098145,
"learning_rate": 4.85e-05,
"loss": 0.0755,
"step": 318
},
{
"epoch": 3.0,
"eval_LOCATION_f1": 0.8609271523178808,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7926829268292683,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.71875,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6571428571428571,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.8571428571428571,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8117647058823529,
"eval_PERSON_recall": 0.9078947368421053,
"eval_QUANTITY_f1": 0.78125,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7352941176470589,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8852459016393444,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.84375,
"eval_TIME_recall": 0.9310344827586207,
"eval_loss": 0.14322705566883087,
"eval_overall_accuracy": 0.9613316261203585,
"eval_overall_f1": 0.8292011019283746,
"eval_overall_precision": 0.7757731958762887,
"eval_overall_recall": 0.8905325443786982,
"eval_runtime": 0.3175,
"eval_samples_per_second": 588.914,
"eval_steps_per_second": 9.448,
"step": 318
},
{
"epoch": 4.0,
"grad_norm": 1.6368614435195923,
"learning_rate": 4.8e-05,
"loss": 0.0504,
"step": 424
},
{
"epoch": 4.0,
"eval_LOCATION_f1": 0.8456375838926175,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7875,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6495726495726496,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6440677966101694,
"eval_ORGANIZATION_recall": 0.6551724137931034,
"eval_PERSON_f1": 0.8734177215189874,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.9078947368421053,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.7761194029850746,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6842105263157895,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.14780984818935394,
"eval_overall_accuracy": 0.9597951344430218,
"eval_overall_f1": 0.8185654008438817,
"eval_overall_precision": 0.7801608579088471,
"eval_overall_recall": 0.8609467455621301,
"eval_runtime": 0.3217,
"eval_samples_per_second": 581.313,
"eval_steps_per_second": 9.326,
"step": 424
},
{
"epoch": 5.0,
"grad_norm": 2.231923818588257,
"learning_rate": 4.75e-05,
"loss": 0.0318,
"step": 530
},
{
"epoch": 5.0,
"eval_LOCATION_f1": 0.8472222222222223,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8133333333333334,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7555555555555555,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6623376623376623,
"eval_ORGANIZATION_recall": 0.8793103448275862,
"eval_PERSON_f1": 0.9079365079365079,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8773006134969326,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.7761194029850748,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.18356788158416748,
"eval_overall_accuracy": 0.9597951344430218,
"eval_overall_f1": 0.8515950069348128,
"eval_overall_precision": 0.8015665796344648,
"eval_overall_recall": 0.908284023668639,
"eval_runtime": 0.3175,
"eval_samples_per_second": 588.92,
"eval_steps_per_second": 9.448,
"step": 530
},
{
"epoch": 6.0,
"grad_norm": 4.4022064208984375,
"learning_rate": 4.7e-05,
"loss": 0.0239,
"step": 636
},
{
"epoch": 6.0,
"eval_LOCATION_f1": 0.8450704225352113,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.821917808219178,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7014925373134329,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.618421052631579,
"eval_ORGANIZATION_recall": 0.8103448275862069,
"eval_PERSON_f1": 0.8478964401294499,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8343949044585988,
"eval_PERSON_recall": 0.8618421052631579,
"eval_QUANTITY_f1": 0.819672131147541,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8064516129032258,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8524590163934426,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.1694508045911789,
"eval_overall_accuracy": 0.9577464788732394,
"eval_overall_f1": 0.8175388967468176,
"eval_overall_precision": 0.7831978319783198,
"eval_overall_recall": 0.8550295857988166,
"eval_runtime": 0.3257,
"eval_samples_per_second": 574.211,
"eval_steps_per_second": 9.212,
"step": 636
},
{
"epoch": 7.0,
"grad_norm": 0.2985347509384155,
"learning_rate": 4.6500000000000005e-05,
"loss": 0.0238,
"step": 742
},
{
"epoch": 7.0,
"eval_LOCATION_f1": 0.853146853146853,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8243243243243243,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.75,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6857142857142857,
"eval_ORGANIZATION_recall": 0.8275862068965517,
"eval_PERSON_f1": 0.8616352201257862,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8253012048192772,
"eval_PERSON_recall": 0.9013157894736842,
"eval_QUANTITY_f1": 0.7352941176470588,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6578947368421053,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.19530388712882996,
"eval_overall_accuracy": 0.9608194622279129,
"eval_overall_f1": 0.8256624825662484,
"eval_overall_precision": 0.7810026385224275,
"eval_overall_recall": 0.8757396449704142,
"eval_runtime": 0.3219,
"eval_samples_per_second": 580.938,
"eval_steps_per_second": 9.32,
"step": 742
},
{
"epoch": 8.0,
"grad_norm": 0.04798915982246399,
"learning_rate": 4.600000000000001e-05,
"loss": 0.0134,
"step": 848
},
{
"epoch": 8.0,
"eval_LOCATION_f1": 0.8435374149659864,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.768,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7164179104477612,
"eval_ORGANIZATION_recall": 0.8275862068965517,
"eval_PERSON_f1": 0.8652037617554859,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8263473053892215,
"eval_PERSON_recall": 0.9078947368421053,
"eval_QUANTITY_f1": 0.7936507936507938,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7575757575757576,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.23003453016281128,
"eval_overall_accuracy": 0.9633802816901409,
"eval_overall_f1": 0.8387096774193548,
"eval_overall_precision": 0.7973333333333333,
"eval_overall_recall": 0.8846153846153846,
"eval_runtime": 0.3389,
"eval_samples_per_second": 551.794,
"eval_steps_per_second": 8.852,
"step": 848
},
{
"epoch": 9.0,
"grad_norm": 0.5828952789306641,
"learning_rate": 4.55e-05,
"loss": 0.0097,
"step": 954
},
{
"epoch": 9.0,
"eval_LOCATION_f1": 0.8356164383561644,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7401574803149606,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6811594202898551,
"eval_ORGANIZATION_recall": 0.8103448275862069,
"eval_PERSON_f1": 0.8859934853420195,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8774193548387097,
"eval_PERSON_recall": 0.8947368421052632,
"eval_QUANTITY_f1": 0.78125,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7352941176470589,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.23057876527309418,
"eval_overall_accuracy": 0.9580025608194622,
"eval_overall_f1": 0.8404558404558404,
"eval_overall_precision": 0.8104395604395604,
"eval_overall_recall": 0.8727810650887574,
"eval_runtime": 0.3211,
"eval_samples_per_second": 582.432,
"eval_steps_per_second": 9.344,
"step": 954
},
{
"epoch": 10.0,
"grad_norm": 0.18654245138168335,
"learning_rate": 4.5e-05,
"loss": 0.0078,
"step": 1060
},
{
"epoch": 10.0,
"eval_LOCATION_f1": 0.8571428571428572,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8076923076923077,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7906976744186047,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7183098591549296,
"eval_ORGANIZATION_recall": 0.8793103448275862,
"eval_PERSON_f1": 0.8753993610223643,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8509316770186336,
"eval_PERSON_recall": 0.9013157894736842,
"eval_QUANTITY_f1": 0.78125,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7352941176470589,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2440958321094513,
"eval_overall_accuracy": 0.9664532650448143,
"eval_overall_f1": 0.849507735583685,
"eval_overall_precision": 0.8096514745308311,
"eval_overall_recall": 0.893491124260355,
"eval_runtime": 0.3238,
"eval_samples_per_second": 577.519,
"eval_steps_per_second": 9.265,
"step": 1060
},
{
"epoch": 11.0,
"grad_norm": 0.014143639244139194,
"learning_rate": 4.4500000000000004e-05,
"loss": 0.0057,
"step": 1166
},
{
"epoch": 11.0,
"eval_LOCATION_f1": 0.8571428571428572,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8076923076923077,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6440677966101694,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6333333333333333,
"eval_ORGANIZATION_recall": 0.6551724137931034,
"eval_PERSON_f1": 0.8838709677419354,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8670886075949367,
"eval_PERSON_recall": 0.9013157894736842,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8524590163934426,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2606862783432007,
"eval_overall_accuracy": 0.9613316261203585,
"eval_overall_f1": 0.8309455587392551,
"eval_overall_precision": 0.8055555555555556,
"eval_overall_recall": 0.8579881656804734,
"eval_runtime": 0.32,
"eval_samples_per_second": 584.447,
"eval_steps_per_second": 9.376,
"step": 1166
},
{
"epoch": 12.0,
"grad_norm": 0.8590062260627747,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.0057,
"step": 1272
},
{
"epoch": 12.0,
"eval_LOCATION_f1": 0.8368794326241135,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8194444444444444,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7627118644067795,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.75,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.8706624605678233,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8363636363636363,
"eval_PERSON_recall": 0.9078947368421053,
"eval_QUANTITY_f1": 0.8064516129032259,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.78125,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.2562354505062103,
"eval_overall_accuracy": 0.9623559539052496,
"eval_overall_f1": 0.8390804597701149,
"eval_overall_precision": 0.8156424581005587,
"eval_overall_recall": 0.863905325443787,
"eval_runtime": 0.3245,
"eval_samples_per_second": 576.335,
"eval_steps_per_second": 9.246,
"step": 1272
},
{
"epoch": 13.0,
"grad_norm": 0.005929162725806236,
"learning_rate": 4.35e-05,
"loss": 0.0041,
"step": 1378
},
{
"epoch": 13.0,
"eval_LOCATION_f1": 0.8724832214765101,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8125,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.7768595041322314,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.746031746031746,
"eval_ORGANIZATION_recall": 0.8103448275862069,
"eval_PERSON_f1": 0.8690095846645369,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.84472049689441,
"eval_PERSON_recall": 0.8947368421052632,
"eval_QUANTITY_f1": 0.819672131147541,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8064516129032258,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.26208436489105225,
"eval_overall_accuracy": 0.964404609475032,
"eval_overall_f1": 0.8506401137980085,
"eval_overall_precision": 0.8191780821917808,
"eval_overall_recall": 0.8846153846153846,
"eval_runtime": 0.3219,
"eval_samples_per_second": 580.969,
"eval_steps_per_second": 9.32,
"step": 1378
},
{
"epoch": 14.0,
"grad_norm": 0.20337995886802673,
"learning_rate": 4.3e-05,
"loss": 0.0045,
"step": 1484
},
{
"epoch": 14.0,
"eval_LOCATION_f1": 0.8311688311688311,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7529411764705882,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7241379310344829,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7241379310344828,
"eval_ORGANIZATION_recall": 0.7241379310344828,
"eval_PERSON_f1": 0.8717948717948718,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.85,
"eval_PERSON_recall": 0.8947368421052632,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8253968253968255,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2810960114002228,
"eval_overall_accuracy": 0.9633802816901409,
"eval_overall_f1": 0.8305084745762711,
"eval_overall_precision": 0.7945945945945946,
"eval_overall_recall": 0.8698224852071006,
"eval_runtime": 0.3298,
"eval_samples_per_second": 566.967,
"eval_steps_per_second": 9.096,
"step": 1484
},
{
"epoch": 15.0,
"grad_norm": 1.0766212940216064,
"learning_rate": 4.25e-05,
"loss": 0.0048,
"step": 1590
},
{
"epoch": 15.0,
"eval_LOCATION_f1": 0.8666666666666666,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8024691358024691,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.7642276422764227,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7230769230769231,
"eval_ORGANIZATION_recall": 0.8103448275862069,
"eval_PERSON_f1": 0.8881789137380192,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8125,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.26082485914230347,
"eval_overall_accuracy": 0.9626120358514725,
"eval_overall_f1": 0.8535211267605635,
"eval_overall_precision": 0.8145161290322581,
"eval_overall_recall": 0.8964497041420119,
"eval_runtime": 0.3242,
"eval_samples_per_second": 576.835,
"eval_steps_per_second": 9.254,
"step": 1590
},
{
"epoch": 16.0,
"grad_norm": 0.31145572662353516,
"learning_rate": 4.2e-05,
"loss": 0.0054,
"step": 1696
},
{
"epoch": 16.0,
"eval_LOCATION_f1": 0.8591549295774648,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8356164383561644,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7441860465116279,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.676056338028169,
"eval_ORGANIZATION_recall": 0.8275862068965517,
"eval_PERSON_f1": 0.8980891719745223,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8703703703703703,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8771929824561403,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8928571428571429,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.26623842120170593,
"eval_overall_accuracy": 0.9608194622279129,
"eval_overall_f1": 0.8551136363636364,
"eval_overall_precision": 0.8224043715846995,
"eval_overall_recall": 0.8905325443786982,
"eval_runtime": 0.3327,
"eval_samples_per_second": 562.013,
"eval_steps_per_second": 9.016,
"step": 1696
},
{
"epoch": 17.0,
"grad_norm": 0.1136045828461647,
"learning_rate": 4.15e-05,
"loss": 0.0048,
"step": 1802
},
{
"epoch": 17.0,
"eval_LOCATION_f1": 0.8666666666666666,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8024691358024691,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.7301587301587301,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6764705882352942,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.8673139158576052,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8535031847133758,
"eval_PERSON_recall": 0.881578947368421,
"eval_QUANTITY_f1": 0.7936507936507938,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7575757575757576,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.7575757575757576,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6756756756756757,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.28109654784202576,
"eval_overall_accuracy": 0.9613316261203585,
"eval_overall_f1": 0.8263305322128851,
"eval_overall_precision": 0.7845744680851063,
"eval_overall_recall": 0.8727810650887574,
"eval_runtime": 0.3218,
"eval_samples_per_second": 581.076,
"eval_steps_per_second": 9.322,
"step": 1802
},
{
"epoch": 18.0,
"grad_norm": 0.021722104400396347,
"learning_rate": 4.1e-05,
"loss": 0.0039,
"step": 1908
},
{
"epoch": 18.0,
"eval_LOCATION_f1": 0.8591549295774648,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8356164383561644,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7692307692307692,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6944444444444444,
"eval_ORGANIZATION_recall": 0.8620689655172413,
"eval_PERSON_f1": 0.8375,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.7976190476190477,
"eval_PERSON_recall": 0.881578947368421,
"eval_QUANTITY_f1": 0.78125,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7352941176470589,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8064516129032258,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7575757575757576,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.29267749190330505,
"eval_overall_accuracy": 0.9574903969270167,
"eval_overall_f1": 0.8217270194986072,
"eval_overall_precision": 0.7763157894736842,
"eval_overall_recall": 0.8727810650887574,
"eval_runtime": 0.3291,
"eval_samples_per_second": 568.172,
"eval_steps_per_second": 9.115,
"step": 1908
},
{
"epoch": 19.0,
"grad_norm": 0.02122313901782036,
"learning_rate": 4.05e-05,
"loss": 0.0038,
"step": 2014
},
{
"epoch": 19.0,
"eval_LOCATION_f1": 0.8767123287671235,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6666666666666667,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6176470588235294,
"eval_ORGANIZATION_recall": 0.7241379310344828,
"eval_PERSON_f1": 0.8974358974358975,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8064516129032259,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.78125,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8524590163934426,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2553775906562805,
"eval_overall_accuracy": 0.9633802816901409,
"eval_overall_f1": 0.8401697312588403,
"eval_overall_precision": 0.8048780487804879,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.3254,
"eval_samples_per_second": 574.754,
"eval_steps_per_second": 9.221,
"step": 2014
},
{
"epoch": 20.0,
"grad_norm": 0.002756689442321658,
"learning_rate": 4e-05,
"loss": 0.0044,
"step": 2120
},
{
"epoch": 20.0,
"eval_LOCATION_f1": 0.8289473684210527,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7590361445783133,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7107438016528926,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6825396825396826,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.896774193548387,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.879746835443038,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8125,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8253968253968255,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2622649371623993,
"eval_overall_accuracy": 0.9620998719590269,
"eval_overall_f1": 0.8366197183098592,
"eval_overall_precision": 0.7983870967741935,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.3319,
"eval_samples_per_second": 563.374,
"eval_steps_per_second": 9.038,
"step": 2120
},
{
"epoch": 21.0,
"grad_norm": 0.012515822425484657,
"learning_rate": 3.9500000000000005e-05,
"loss": 0.0033,
"step": 2226
},
{
"epoch": 21.0,
"eval_LOCATION_f1": 0.8513513513513514,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7974683544303798,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.735042735042735,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7288135593220338,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.8853503184713376,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8580246913580247,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.7878787878787877,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7222222222222222,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.27664482593536377,
"eval_overall_accuracy": 0.9600512163892445,
"eval_overall_f1": 0.8397163120567377,
"eval_overall_precision": 0.8065395095367848,
"eval_overall_recall": 0.8757396449704142,
"eval_runtime": 0.3226,
"eval_samples_per_second": 579.696,
"eval_steps_per_second": 9.3,
"step": 2226
},
{
"epoch": 22.0,
"grad_norm": 0.001122328918427229,
"learning_rate": 3.9000000000000006e-05,
"loss": 0.0048,
"step": 2332
},
{
"epoch": 22.0,
"eval_LOCATION_f1": 0.8904109589041096,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8441558441558441,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.7727272727272727,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6891891891891891,
"eval_ORGANIZATION_recall": 0.8793103448275862,
"eval_PERSON_f1": 0.8974358974358975,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.26052865386009216,
"eval_overall_accuracy": 0.9651728553137003,
"eval_overall_f1": 0.8651685393258427,
"eval_overall_precision": 0.8235294117647058,
"eval_overall_recall": 0.9112426035502958,
"eval_runtime": 0.33,
"eval_samples_per_second": 566.654,
"eval_steps_per_second": 9.091,
"step": 2332
},
{
"epoch": 23.0,
"grad_norm": 0.01085362397134304,
"learning_rate": 3.85e-05,
"loss": 0.003,
"step": 2438
},
{
"epoch": 23.0,
"eval_LOCATION_f1": 0.8378378378378378,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.7727272727272727,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6891891891891891,
"eval_ORGANIZATION_recall": 0.8793103448275862,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8860759493670886,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2736039459705353,
"eval_overall_accuracy": 0.9646606914212548,
"eval_overall_f1": 0.8567415730337079,
"eval_overall_precision": 0.8155080213903744,
"eval_overall_recall": 0.9023668639053254,
"eval_runtime": 0.3239,
"eval_samples_per_second": 577.377,
"eval_steps_per_second": 9.263,
"step": 2438
},
{
"epoch": 24.0,
"grad_norm": 0.02887049876153469,
"learning_rate": 3.8e-05,
"loss": 0.0024,
"step": 2544
},
{
"epoch": 24.0,
"eval_LOCATION_f1": 0.8666666666666666,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8024691358024691,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.7244094488188977,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.9090909090909091,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8974358974358975,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8125,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.28270941972732544,
"eval_overall_accuracy": 0.9646606914212548,
"eval_overall_f1": 0.8559322033898306,
"eval_overall_precision": 0.8189189189189189,
"eval_overall_recall": 0.8964497041420119,
"eval_runtime": 0.3467,
"eval_samples_per_second": 539.396,
"eval_steps_per_second": 8.653,
"step": 2544
},
{
"epoch": 25.0,
"grad_norm": 0.0016468241810798645,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.0024,
"step": 2650
},
{
"epoch": 25.0,
"eval_LOCATION_f1": 0.8648648648648648,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7681159420289855,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6625,
"eval_ORGANIZATION_recall": 0.9137931034482759,
"eval_PERSON_f1": 0.8980891719745223,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8703703703703703,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8125,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7647058823529411,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.28754085302352905,
"eval_overall_accuracy": 0.9646606914212548,
"eval_overall_f1": 0.8587257617728532,
"eval_overall_precision": 0.8072916666666666,
"eval_overall_recall": 0.9171597633136095,
"eval_runtime": 0.3225,
"eval_samples_per_second": 579.871,
"eval_steps_per_second": 9.303,
"step": 2650
},
{
"epoch": 26.0,
"grad_norm": 0.22259019315242767,
"learning_rate": 3.7e-05,
"loss": 0.0025,
"step": 2756
},
{
"epoch": 26.0,
"eval_LOCATION_f1": 0.8378378378378378,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.728813559322034,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7166666666666667,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.8924050632911392,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8597560975609756,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2877175509929657,
"eval_overall_accuracy": 0.9641485275288092,
"eval_overall_f1": 0.8477951635846374,
"eval_overall_precision": 0.8164383561643835,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.3224,
"eval_samples_per_second": 580.076,
"eval_steps_per_second": 9.306,
"step": 2756
},
{
"epoch": 27.0,
"grad_norm": 0.013442899100482464,
"learning_rate": 3.65e-05,
"loss": 0.0038,
"step": 2862
},
{
"epoch": 27.0,
"eval_LOCATION_f1": 0.8289473684210527,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7590361445783133,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6825396825396826,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6323529411764706,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.9196141479099678,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.89937106918239,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.8,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7428571428571429,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.29557737708091736,
"eval_overall_accuracy": 0.9610755441741358,
"eval_overall_f1": 0.840782122905028,
"eval_overall_precision": 0.7962962962962963,
"eval_overall_recall": 0.8905325443786982,
"eval_runtime": 0.3217,
"eval_samples_per_second": 581.31,
"eval_steps_per_second": 9.326,
"step": 2862
},
{
"epoch": 28.0,
"grad_norm": 0.033651720732450485,
"learning_rate": 3.6e-05,
"loss": 0.0046,
"step": 2968
},
{
"epoch": 28.0,
"eval_LOCATION_f1": 0.8609271523178808,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7926829268292683,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.7559055118110236,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6956521739130435,
"eval_ORGANIZATION_recall": 0.8275862068965517,
"eval_PERSON_f1": 0.9044585987261147,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8765432098765432,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2740738093852997,
"eval_overall_accuracy": 0.9649167733674776,
"eval_overall_f1": 0.8599439775910365,
"eval_overall_precision": 0.8164893617021277,
"eval_overall_recall": 0.908284023668639,
"eval_runtime": 0.3277,
"eval_samples_per_second": 570.688,
"eval_steps_per_second": 9.155,
"step": 2968
},
{
"epoch": 29.0,
"grad_norm": 0.0036596679128706455,
"learning_rate": 3.55e-05,
"loss": 0.0022,
"step": 3074
},
{
"epoch": 29.0,
"eval_LOCATION_f1": 0.8689655172413793,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8289473684210527,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7936507936507937,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7352941176470589,
"eval_ORGANIZATION_recall": 0.8620689655172413,
"eval_PERSON_f1": 0.9126213592233009,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8980891719745223,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.280216246843338,
"eval_overall_accuracy": 0.9667093469910372,
"eval_overall_f1": 0.8730385164051355,
"eval_overall_precision": 0.8429752066115702,
"eval_overall_recall": 0.9053254437869822,
"eval_runtime": 0.3236,
"eval_samples_per_second": 577.801,
"eval_steps_per_second": 9.27,
"step": 3074
},
{
"epoch": 30.0,
"grad_norm": 0.09640705585479736,
"learning_rate": 3.5e-05,
"loss": 0.002,
"step": 3180
},
{
"epoch": 30.0,
"eval_LOCATION_f1": 0.8590604026845639,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7903225806451614,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7424242424242424,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.9038461538461539,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.88125,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.29095637798309326,
"eval_overall_accuracy": 0.9674775928297055,
"eval_overall_f1": 0.8680851063829786,
"eval_overall_precision": 0.8337874659400545,
"eval_overall_recall": 0.9053254437869822,
"eval_runtime": 0.3288,
"eval_samples_per_second": 568.665,
"eval_steps_per_second": 9.123,
"step": 3180
},
{
"epoch": 31.0,
"grad_norm": 0.002530389465391636,
"learning_rate": 3.45e-05,
"loss": 0.0015,
"step": 3286
},
{
"epoch": 31.0,
"eval_LOCATION_f1": 0.8571428571428572,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8076923076923077,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.768,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7164179104477612,
"eval_ORGANIZATION_recall": 0.8275862068965517,
"eval_PERSON_f1": 0.9049180327868853,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.9019607843137255,
"eval_PERSON_recall": 0.9078947368421053,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.29163551330566406,
"eval_overall_accuracy": 0.9661971830985916,
"eval_overall_f1": 0.8637015781922526,
"eval_overall_precision": 0.8384401114206128,
"eval_overall_recall": 0.8905325443786982,
"eval_runtime": 0.3204,
"eval_samples_per_second": 583.719,
"eval_steps_per_second": 9.364,
"step": 3286
},
{
"epoch": 32.0,
"grad_norm": 0.03596256300806999,
"learning_rate": 3.4000000000000007e-05,
"loss": 0.004,
"step": 3392
},
{
"epoch": 32.0,
"eval_LOCATION_f1": 0.881118881118881,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8513513513513513,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7704918032786885,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.734375,
"eval_ORGANIZATION_recall": 0.8103448275862069,
"eval_PERSON_f1": 0.9003215434083601,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8805031446540881,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.285200834274292,
"eval_overall_accuracy": 0.9649167733674776,
"eval_overall_f1": 0.860832137733142,
"eval_overall_precision": 0.8356545961002786,
"eval_overall_recall": 0.8875739644970414,
"eval_runtime": 0.333,
"eval_samples_per_second": 561.561,
"eval_steps_per_second": 9.009,
"step": 3392
},
{
"epoch": 33.0,
"grad_norm": 0.008540854789316654,
"learning_rate": 3.35e-05,
"loss": 0.0038,
"step": 3498
},
{
"epoch": 33.0,
"eval_LOCATION_f1": 0.863013698630137,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8181818181818182,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.8032786885245901,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.765625,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.9015873015873016,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8711656441717791,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.28712666034698486,
"eval_overall_accuracy": 0.9649167733674776,
"eval_overall_f1": 0.8640226628895185,
"eval_overall_precision": 0.8288043478260869,
"eval_overall_recall": 0.9023668639053254,
"eval_runtime": 0.3198,
"eval_samples_per_second": 584.775,
"eval_steps_per_second": 9.381,
"step": 3498
},
{
"epoch": 34.0,
"grad_norm": 0.0038193664513528347,
"learning_rate": 3.3e-05,
"loss": 0.0042,
"step": 3604
},
{
"epoch": 34.0,
"eval_LOCATION_f1": 0.8749999999999999,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.84,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7272727272727273,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6486486486486487,
"eval_ORGANIZATION_recall": 0.8275862068965517,
"eval_PERSON_f1": 0.8996763754045308,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8853503184713376,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.29013821482658386,
"eval_overall_accuracy": 0.9623559539052496,
"eval_overall_f1": 0.8543140028288543,
"eval_overall_precision": 0.8184281842818428,
"eval_overall_recall": 0.893491124260355,
"eval_runtime": 0.3361,
"eval_samples_per_second": 556.385,
"eval_steps_per_second": 8.926,
"step": 3604
},
{
"epoch": 35.0,
"grad_norm": 0.014040589332580566,
"learning_rate": 3.2500000000000004e-05,
"loss": 0.0026,
"step": 3710
},
{
"epoch": 35.0,
"eval_LOCATION_f1": 0.8533333333333333,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7901234567901234,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7936507936507937,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7352941176470589,
"eval_ORGANIZATION_recall": 0.8620689655172413,
"eval_PERSON_f1": 0.9161290322580645,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8987341772151899,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.27812227606773376,
"eval_overall_accuracy": 0.9659411011523688,
"eval_overall_f1": 0.8700564971751412,
"eval_overall_precision": 0.8324324324324325,
"eval_overall_recall": 0.9112426035502958,
"eval_runtime": 0.3232,
"eval_samples_per_second": 578.539,
"eval_steps_per_second": 9.281,
"step": 3710
},
{
"epoch": 36.0,
"grad_norm": 0.0036135606933385134,
"learning_rate": 3.2000000000000005e-05,
"loss": 0.0021,
"step": 3816
},
{
"epoch": 36.0,
"eval_LOCATION_f1": 0.8551724137931034,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8157894736842105,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.8091603053435115,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.726027397260274,
"eval_ORGANIZATION_recall": 0.9137931034482759,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8860759493670886,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8771929824561403,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8928571428571429,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.29289114475250244,
"eval_overall_accuracy": 0.9641485275288092,
"eval_overall_f1": 0.8668555240793201,
"eval_overall_precision": 0.8315217391304348,
"eval_overall_recall": 0.9053254437869822,
"eval_runtime": 0.3214,
"eval_samples_per_second": 581.814,
"eval_steps_per_second": 9.334,
"step": 3816
},
{
"epoch": 37.0,
"grad_norm": 0.047017503529787064,
"learning_rate": 3.15e-05,
"loss": 0.002,
"step": 3922
},
{
"epoch": 37.0,
"eval_LOCATION_f1": 0.84,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7777777777777778,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7967479674796748,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7538461538461538,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.9078947368421053,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.9078947368421053,
"eval_PERSON_recall": 0.9078947368421053,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.2750895619392395,
"eval_overall_accuracy": 0.9641485275288092,
"eval_overall_f1": 0.8612303290414879,
"eval_overall_precision": 0.8337950138504155,
"eval_overall_recall": 0.8905325443786982,
"eval_runtime": 0.3236,
"eval_samples_per_second": 577.827,
"eval_steps_per_second": 9.27,
"step": 3922
},
{
"epoch": 38.0,
"grad_norm": 0.002975118113681674,
"learning_rate": 3.1e-05,
"loss": 0.0032,
"step": 4028
},
{
"epoch": 38.0,
"eval_LOCATION_f1": 0.8344370860927153,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7682926829268293,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7933884297520662,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7619047619047619,
"eval_ORGANIZATION_recall": 0.8275862068965517,
"eval_PERSON_f1": 0.9096774193548387,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8924050632911392,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.847457627118644,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.292982280254364,
"eval_overall_accuracy": 0.9669654289372599,
"eval_overall_f1": 0.8607954545454546,
"eval_overall_precision": 0.8278688524590164,
"eval_overall_recall": 0.8964497041420119,
"eval_runtime": 0.3205,
"eval_samples_per_second": 583.486,
"eval_steps_per_second": 9.361,
"step": 4028
},
{
"epoch": 39.0,
"grad_norm": 0.048705920577049255,
"learning_rate": 3.05e-05,
"loss": 0.0014,
"step": 4134
},
{
"epoch": 39.0,
"eval_LOCATION_f1": 0.888888888888889,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8533333333333334,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7833333333333333,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7580645161290323,
"eval_ORGANIZATION_recall": 0.8103448275862069,
"eval_PERSON_f1": 0.9009584664536742,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8757763975155279,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.847457627118644,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.26422762870788574,
"eval_overall_accuracy": 0.9677336747759283,
"eval_overall_f1": 0.8681948424068767,
"eval_overall_precision": 0.8416666666666667,
"eval_overall_recall": 0.8964497041420119,
"eval_runtime": 0.3204,
"eval_samples_per_second": 583.697,
"eval_steps_per_second": 9.364,
"step": 4134
},
{
"epoch": 40.0,
"grad_norm": 0.0028175306506454945,
"learning_rate": 3e-05,
"loss": 0.0022,
"step": 4240
},
{
"epoch": 40.0,
"eval_LOCATION_f1": 0.84,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7777777777777778,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7479674796747967,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7076923076923077,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8860759493670886,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.30111193656921387,
"eval_overall_accuracy": 0.9661971830985916,
"eval_overall_f1": 0.8534850640113798,
"eval_overall_precision": 0.821917808219178,
"eval_overall_recall": 0.8875739644970414,
"eval_runtime": 0.3358,
"eval_samples_per_second": 556.909,
"eval_steps_per_second": 8.934,
"step": 4240
},
{
"epoch": 41.0,
"grad_norm": 0.017286457121372223,
"learning_rate": 2.95e-05,
"loss": 0.0023,
"step": 4346
},
{
"epoch": 41.0,
"eval_LOCATION_f1": 0.8689655172413793,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8289473684210527,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.752136752136752,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7457627118644068,
"eval_ORGANIZATION_recall": 0.7586206896551724,
"eval_PERSON_f1": 0.8974358974358975,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.29203903675079346,
"eval_overall_accuracy": 0.9659411011523688,
"eval_overall_f1": 0.8587896253602305,
"eval_overall_precision": 0.8370786516853933,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.3197,
"eval_samples_per_second": 584.864,
"eval_steps_per_second": 9.383,
"step": 4346
},
{
"epoch": 42.0,
"grad_norm": 0.021444261074066162,
"learning_rate": 2.9e-05,
"loss": 0.0026,
"step": 4452
},
{
"epoch": 42.0,
"eval_LOCATION_f1": 0.8648648648648648,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7868852459016394,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.75,
"eval_ORGANIZATION_recall": 0.8275862068965517,
"eval_PERSON_f1": 0.8974358974358975,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.2897973358631134,
"eval_overall_accuracy": 0.9646606914212548,
"eval_overall_f1": 0.8607954545454546,
"eval_overall_precision": 0.8278688524590164,
"eval_overall_recall": 0.8964497041420119,
"eval_runtime": 0.3355,
"eval_samples_per_second": 557.358,
"eval_steps_per_second": 8.942,
"step": 4452
},
{
"epoch": 43.0,
"grad_norm": 0.01654691994190216,
"learning_rate": 2.8499999999999998e-05,
"loss": 0.0015,
"step": 4558
},
{
"epoch": 43.0,
"eval_LOCATION_f1": 0.8533333333333333,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7901234567901234,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7819548872180451,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6933333333333334,
"eval_ORGANIZATION_recall": 0.896551724137931,
"eval_PERSON_f1": 0.9067524115755626,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8867924528301887,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.847457627118644,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.31039759516716003,
"eval_overall_accuracy": 0.9649167733674776,
"eval_overall_f1": 0.8603351955307262,
"eval_overall_precision": 0.8148148148148148,
"eval_overall_recall": 0.9112426035502958,
"eval_runtime": 0.3294,
"eval_samples_per_second": 567.728,
"eval_steps_per_second": 9.108,
"step": 4558
},
{
"epoch": 44.0,
"grad_norm": 0.013932665809988976,
"learning_rate": 2.8000000000000003e-05,
"loss": 0.0016,
"step": 4664
},
{
"epoch": 44.0,
"eval_LOCATION_f1": 0.8456375838926175,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7875,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7999999999999999,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.746268656716418,
"eval_ORGANIZATION_recall": 0.8620689655172413,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8860759493670886,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.30845847725868225,
"eval_overall_accuracy": 0.9641485275288092,
"eval_overall_f1": 0.8620199146514936,
"eval_overall_precision": 0.8301369863013699,
"eval_overall_recall": 0.8964497041420119,
"eval_runtime": 0.3211,
"eval_samples_per_second": 582.336,
"eval_steps_per_second": 9.342,
"step": 4664
},
{
"epoch": 45.0,
"grad_norm": 0.011009820736944675,
"learning_rate": 2.7500000000000004e-05,
"loss": 0.0018,
"step": 4770
},
{
"epoch": 45.0,
"eval_LOCATION_f1": 0.8590604026845639,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7596899224806202,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6901408450704225,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.9003215434083601,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8805031446540881,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.847457627118644,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.3025805950164795,
"eval_overall_accuracy": 0.9615877080665813,
"eval_overall_f1": 0.8551336146272854,
"eval_overall_precision": 0.8150134048257373,
"eval_overall_recall": 0.8994082840236687,
"eval_runtime": 0.3247,
"eval_samples_per_second": 575.917,
"eval_steps_per_second": 9.239,
"step": 4770
},
{
"epoch": 46.0,
"grad_norm": 13.414834022521973,
"learning_rate": 2.7000000000000002e-05,
"loss": 0.0033,
"step": 4876
},
{
"epoch": 46.0,
"eval_LOCATION_f1": 0.8366013071895425,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7619047619047619,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7479674796747967,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7076923076923077,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.8945686900958467,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.2862217128276825,
"eval_overall_accuracy": 0.963124199743918,
"eval_overall_f1": 0.8455056179775281,
"eval_overall_precision": 0.8048128342245989,
"eval_overall_recall": 0.8905325443786982,
"eval_runtime": 0.335,
"eval_samples_per_second": 558.225,
"eval_steps_per_second": 8.955,
"step": 4876
},
{
"epoch": 47.0,
"grad_norm": 0.003819537116214633,
"learning_rate": 2.6500000000000004e-05,
"loss": 0.0007,
"step": 4982
},
{
"epoch": 47.0,
"eval_LOCATION_f1": 0.888888888888889,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8533333333333334,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7666666666666667,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7419354838709677,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.9126213592233009,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8980891719745223,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.28280648589134216,
"eval_overall_accuracy": 0.9690140845070423,
"eval_overall_f1": 0.8715728715728714,
"eval_overall_precision": 0.8507042253521127,
"eval_overall_recall": 0.893491124260355,
"eval_runtime": 0.3231,
"eval_samples_per_second": 578.72,
"eval_steps_per_second": 9.284,
"step": 4982
},
{
"epoch": 48.0,
"grad_norm": 0.046515222638845444,
"learning_rate": 2.6000000000000002e-05,
"loss": 0.0018,
"step": 5088
},
{
"epoch": 48.0,
"eval_LOCATION_f1": 0.8767123287671235,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.75,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6857142857142857,
"eval_ORGANIZATION_recall": 0.8275862068965517,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8860759493670886,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.847457627118644,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.2690236270427704,
"eval_overall_accuracy": 0.9664532650448143,
"eval_overall_f1": 0.8595744680851063,
"eval_overall_precision": 0.8256130790190735,
"eval_overall_recall": 0.8964497041420119,
"eval_runtime": 0.3232,
"eval_samples_per_second": 578.625,
"eval_steps_per_second": 9.283,
"step": 5088
},
{
"epoch": 49.0,
"grad_norm": 0.002773936837911606,
"learning_rate": 2.5500000000000003e-05,
"loss": 0.0005,
"step": 5194
},
{
"epoch": 49.0,
"eval_LOCATION_f1": 0.870748299319728,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8205128205128205,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7317073170731708,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6923076923076923,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.8881789137380192,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.870967741935484,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.84375,
"eval_QUANTITY_recall": 0.9,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.28763094544410706,
"eval_overall_accuracy": 0.9641485275288092,
"eval_overall_f1": 0.8534850640113798,
"eval_overall_precision": 0.821917808219178,
"eval_overall_recall": 0.8875739644970414,
"eval_runtime": 0.3215,
"eval_samples_per_second": 581.6,
"eval_steps_per_second": 9.33,
"step": 5194
},
{
"epoch": 50.0,
"grad_norm": 0.001465336070396006,
"learning_rate": 2.5e-05,
"loss": 0.0017,
"step": 5300
},
{
"epoch": 50.0,
"eval_LOCATION_f1": 0.8648648648648648,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.711864406779661,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7,
"eval_ORGANIZATION_recall": 0.7241379310344828,
"eval_PERSON_f1": 0.9061488673139159,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.89171974522293,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.3069976568222046,
"eval_overall_accuracy": 0.964404609475032,
"eval_overall_f1": 0.8522238163558107,
"eval_overall_precision": 0.8272980501392758,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.3366,
"eval_samples_per_second": 555.511,
"eval_steps_per_second": 8.912,
"step": 5300
},
{
"epoch": 51.0,
"grad_norm": 0.0014170885551720858,
"learning_rate": 2.45e-05,
"loss": 0.0009,
"step": 5406
},
{
"epoch": 51.0,
"eval_LOCATION_f1": 0.870748299319728,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8205128205128205,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7812500000000001,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7142857142857143,
"eval_ORGANIZATION_recall": 0.8620689655172413,
"eval_PERSON_f1": 0.9061488673139159,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.89171974522293,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.847457627118644,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.3090084195137024,
"eval_overall_accuracy": 0.9649167733674776,
"eval_overall_f1": 0.8652482269503546,
"eval_overall_precision": 0.8310626702997275,
"eval_overall_recall": 0.9023668639053254,
"eval_runtime": 0.3236,
"eval_samples_per_second": 577.785,
"eval_steps_per_second": 9.269,
"step": 5406
},
{
"epoch": 52.0,
"grad_norm": 0.009222417138516903,
"learning_rate": 2.4e-05,
"loss": 0.0005,
"step": 5512
},
{
"epoch": 52.0,
"eval_LOCATION_f1": 0.8590604026845639,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7377049180327868,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.703125,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.8996763754045308,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8853503184713376,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3099108636379242,
"eval_overall_accuracy": 0.9656850192061459,
"eval_overall_f1": 0.855920114122682,
"eval_overall_precision": 0.8264462809917356,
"eval_overall_recall": 0.8875739644970414,
"eval_runtime": 0.3275,
"eval_samples_per_second": 570.979,
"eval_steps_per_second": 9.16,
"step": 5512
},
{
"epoch": 53.0,
"grad_norm": 0.0005486037116497755,
"learning_rate": 2.35e-05,
"loss": 0.001,
"step": 5618
},
{
"epoch": 53.0,
"eval_LOCATION_f1": 0.8533333333333333,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7901234567901234,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7666666666666667,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7419354838709677,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.8996763754045308,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8853503184713376,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.31158438324928284,
"eval_overall_accuracy": 0.9649167733674776,
"eval_overall_f1": 0.8587731811697575,
"eval_overall_precision": 0.8292011019283747,
"eval_overall_recall": 0.8905325443786982,
"eval_runtime": 0.3209,
"eval_samples_per_second": 582.696,
"eval_steps_per_second": 9.348,
"step": 5618
},
{
"epoch": 54.0,
"grad_norm": 0.0006028018542565405,
"learning_rate": 2.3000000000000003e-05,
"loss": 0.0006,
"step": 5724
},
{
"epoch": 54.0,
"eval_LOCATION_f1": 0.8533333333333333,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7901234567901234,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7377049180327868,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.703125,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.9055374592833876,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.896774193548387,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.847457627118644,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.317971795797348,
"eval_overall_accuracy": 0.964404609475032,
"eval_overall_f1": 0.8542857142857142,
"eval_overall_precision": 0.8259668508287292,
"eval_overall_recall": 0.8846153846153846,
"eval_runtime": 0.3274,
"eval_samples_per_second": 571.109,
"eval_steps_per_second": 9.162,
"step": 5724
},
{
"epoch": 55.0,
"grad_norm": 0.0006948837544769049,
"learning_rate": 2.25e-05,
"loss": 0.0004,
"step": 5830
},
{
"epoch": 55.0,
"eval_LOCATION_f1": 0.8590604026845639,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7500000000000001,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7258064516129032,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8860759493670886,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.32179853320121765,
"eval_overall_accuracy": 0.9646606914212548,
"eval_overall_f1": 0.8583690987124463,
"eval_overall_precision": 0.8310249307479224,
"eval_overall_recall": 0.8875739644970414,
"eval_runtime": 0.3207,
"eval_samples_per_second": 583.185,
"eval_steps_per_second": 9.356,
"step": 5830
},
{
"epoch": 56.0,
"grad_norm": 0.0012037695851176977,
"learning_rate": 2.2000000000000003e-05,
"loss": 0.0006,
"step": 5936
},
{
"epoch": 56.0,
"eval_LOCATION_f1": 0.8533333333333333,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7901234567901234,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7333333333333333,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7096774193548387,
"eval_ORGANIZATION_recall": 0.7586206896551724,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8860759493670886,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.33105283975601196,
"eval_overall_accuracy": 0.9633802816901409,
"eval_overall_f1": 0.8518518518518519,
"eval_overall_precision": 0.8214285714285714,
"eval_overall_recall": 0.8846153846153846,
"eval_runtime": 0.3391,
"eval_samples_per_second": 551.529,
"eval_steps_per_second": 8.848,
"step": 5936
},
{
"epoch": 57.0,
"grad_norm": 0.0022144129034131765,
"learning_rate": 2.15e-05,
"loss": 0.0009,
"step": 6042
},
{
"epoch": 57.0,
"eval_LOCATION_f1": 0.8476821192052981,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7804878048780488,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7419354838709677,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.696969696969697,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.896774193548387,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.879746835443038,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.31793665885925293,
"eval_overall_accuracy": 0.964404609475032,
"eval_overall_f1": 0.8486562942008485,
"eval_overall_precision": 0.8130081300813008,
"eval_overall_recall": 0.8875739644970414,
"eval_runtime": 0.3249,
"eval_samples_per_second": 575.562,
"eval_steps_per_second": 9.234,
"step": 6042
},
{
"epoch": 58.0,
"grad_norm": 0.0016710077179595828,
"learning_rate": 2.1e-05,
"loss": 0.002,
"step": 6148
},
{
"epoch": 58.0,
"eval_LOCATION_f1": 0.870748299319728,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8205128205128205,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6725663716814159,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6909090909090909,
"eval_ORGANIZATION_recall": 0.6551724137931034,
"eval_PERSON_f1": 0.9155844155844156,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.9038461538461539,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8064516129032259,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.78125,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.27503037452697754,
"eval_overall_accuracy": 0.9638924455825865,
"eval_overall_f1": 0.8546511627906976,
"eval_overall_precision": 0.84,
"eval_overall_recall": 0.8698224852071006,
"eval_runtime": 0.3317,
"eval_samples_per_second": 563.712,
"eval_steps_per_second": 9.044,
"step": 6148
},
{
"epoch": 59.0,
"grad_norm": 0.03837126865983009,
"learning_rate": 2.05e-05,
"loss": 0.0018,
"step": 6254
},
{
"epoch": 59.0,
"eval_LOCATION_f1": 0.8648648648648648,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7540983606557378,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.71875,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.8996763754045308,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8853503184713376,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8771929824561403,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8928571428571429,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.29145359992980957,
"eval_overall_accuracy": 0.9656850192061459,
"eval_overall_f1": 0.8583690987124463,
"eval_overall_precision": 0.8310249307479224,
"eval_overall_recall": 0.8875739644970414,
"eval_runtime": 0.3233,
"eval_samples_per_second": 578.416,
"eval_steps_per_second": 9.279,
"step": 6254
},
{
"epoch": 60.0,
"grad_norm": 0.10238273441791534,
"learning_rate": 2e-05,
"loss": 0.0008,
"step": 6360
},
{
"epoch": 60.0,
"eval_LOCATION_f1": 0.8648648648648648,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7027027027027026,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7358490566037735,
"eval_ORGANIZATION_recall": 0.6724137931034483,
"eval_PERSON_f1": 0.9025974025974026,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8910256410256411,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8771929824561403,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8928571428571429,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.31033989787101746,
"eval_overall_accuracy": 0.9649167733674776,
"eval_overall_f1": 0.8542274052478134,
"eval_overall_precision": 0.8419540229885057,
"eval_overall_recall": 0.8668639053254438,
"eval_runtime": 0.3317,
"eval_samples_per_second": 563.83,
"eval_steps_per_second": 9.045,
"step": 6360
},
{
"epoch": 61.0,
"grad_norm": 0.002005122834816575,
"learning_rate": 1.9500000000000003e-05,
"loss": 0.0013,
"step": 6466
},
{
"epoch": 61.0,
"eval_LOCATION_f1": 0.8749999999999999,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.84,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7868852459016394,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.75,
"eval_ORGANIZATION_recall": 0.8275862068965517,
"eval_PERSON_f1": 0.9003215434083601,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8805031446540881,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2831355929374695,
"eval_overall_accuracy": 0.9661971830985916,
"eval_overall_f1": 0.8681948424068767,
"eval_overall_precision": 0.8416666666666667,
"eval_overall_recall": 0.8964497041420119,
"eval_runtime": 0.3193,
"eval_samples_per_second": 585.653,
"eval_steps_per_second": 9.395,
"step": 6466
},
{
"epoch": 62.0,
"grad_norm": 0.0019113136222586036,
"learning_rate": 1.9e-05,
"loss": 0.0013,
"step": 6572
},
{
"epoch": 62.0,
"eval_LOCATION_f1": 0.870748299319728,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8205128205128205,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7999999999999999,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.746268656716418,
"eval_ORGANIZATION_recall": 0.8620689655172413,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8860759493670886,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.29855355620384216,
"eval_overall_accuracy": 0.967989756722151,
"eval_overall_f1": 0.8717948717948717,
"eval_overall_precision": 0.8406593406593407,
"eval_overall_recall": 0.9053254437869822,
"eval_runtime": 0.327,
"eval_samples_per_second": 571.832,
"eval_steps_per_second": 9.174,
"step": 6572
},
{
"epoch": 63.0,
"grad_norm": 0.0004677773977164179,
"learning_rate": 1.85e-05,
"loss": 0.0009,
"step": 6678
},
{
"epoch": 63.0,
"eval_LOCATION_f1": 0.8513513513513514,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7974683544303798,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.8064516129032258,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7575757575757576,
"eval_ORGANIZATION_recall": 0.8620689655172413,
"eval_PERSON_f1": 0.8881789137380192,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.8387096774193549,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.8125,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3033183217048645,
"eval_overall_accuracy": 0.9661971830985916,
"eval_overall_f1": 0.8624113475177306,
"eval_overall_precision": 0.8283378746594006,
"eval_overall_recall": 0.8994082840236687,
"eval_runtime": 0.3215,
"eval_samples_per_second": 581.707,
"eval_steps_per_second": 9.332,
"step": 6678
},
{
"epoch": 64.0,
"grad_norm": 0.005429080221801996,
"learning_rate": 1.8e-05,
"loss": 0.0017,
"step": 6784
},
{
"epoch": 64.0,
"eval_LOCATION_f1": 0.8476821192052981,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7804878048780488,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7906976744186047,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7183098591549296,
"eval_ORGANIZATION_recall": 0.8793103448275862,
"eval_PERSON_f1": 0.9038461538461539,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.88125,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.30157363414764404,
"eval_overall_accuracy": 0.9667093469910372,
"eval_overall_f1": 0.8627450980392156,
"eval_overall_precision": 0.8191489361702128,
"eval_overall_recall": 0.9112426035502958,
"eval_runtime": 0.3301,
"eval_samples_per_second": 566.553,
"eval_steps_per_second": 9.089,
"step": 6784
},
{
"epoch": 65.0,
"grad_norm": 0.0004326178168412298,
"learning_rate": 1.75e-05,
"loss": 0.0007,
"step": 6890
},
{
"epoch": 65.0,
"eval_LOCATION_f1": 0.8590604026845639,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7751937984496124,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.704225352112676,
"eval_ORGANIZATION_recall": 0.8620689655172413,
"eval_PERSON_f1": 0.9038461538461539,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.88125,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3076171875,
"eval_overall_accuracy": 0.9661971830985916,
"eval_overall_f1": 0.8635724331926863,
"eval_overall_precision": 0.8230563002680965,
"eval_overall_recall": 0.908284023668639,
"eval_runtime": 0.3217,
"eval_samples_per_second": 581.291,
"eval_steps_per_second": 9.326,
"step": 6890
},
{
"epoch": 66.0,
"grad_norm": 0.001978162443265319,
"learning_rate": 1.7000000000000003e-05,
"loss": 0.0013,
"step": 6996
},
{
"epoch": 66.0,
"eval_LOCATION_f1": 0.8571428571428572,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8076923076923077,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7999999999999999,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.746268656716418,
"eval_ORGANIZATION_recall": 0.8620689655172413,
"eval_PERSON_f1": 0.9096774193548387,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8924050632911392,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2962900996208191,
"eval_overall_accuracy": 0.9638924455825865,
"eval_overall_f1": 0.8656294200848657,
"eval_overall_precision": 0.8292682926829268,
"eval_overall_recall": 0.9053254437869822,
"eval_runtime": 0.3273,
"eval_samples_per_second": 571.366,
"eval_steps_per_second": 9.166,
"step": 6996
},
{
"epoch": 67.0,
"grad_norm": 0.000865288486238569,
"learning_rate": 1.65e-05,
"loss": 0.0011,
"step": 7102
},
{
"epoch": 67.0,
"eval_LOCATION_f1": 0.8571428571428572,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8076923076923077,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7317073170731708,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6923076923076923,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.8974358974358975,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3187943994998932,
"eval_overall_accuracy": 0.9633802816901409,
"eval_overall_f1": 0.851063829787234,
"eval_overall_precision": 0.8174386920980926,
"eval_overall_recall": 0.8875739644970414,
"eval_runtime": 0.3211,
"eval_samples_per_second": 582.391,
"eval_steps_per_second": 9.343,
"step": 7102
},
{
"epoch": 68.0,
"grad_norm": 0.00021025155729148537,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.0009,
"step": 7208
},
{
"epoch": 68.0,
"eval_LOCATION_f1": 0.8648648648648648,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.784,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7313432835820896,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.8987341772151899,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8658536585365854,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.33562034368515015,
"eval_overall_accuracy": 0.964404609475032,
"eval_overall_f1": 0.8623595505617977,
"eval_overall_precision": 0.820855614973262,
"eval_overall_recall": 0.908284023668639,
"eval_runtime": 0.3272,
"eval_samples_per_second": 571.432,
"eval_steps_per_second": 9.167,
"step": 7208
},
{
"epoch": 69.0,
"grad_norm": 0.032114915549755096,
"learning_rate": 1.55e-05,
"loss": 0.001,
"step": 7314
},
{
"epoch": 69.0,
"eval_LOCATION_f1": 0.8783783783783783,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8227848101265823,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.7377049180327868,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.703125,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.9260450160771704,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.9056603773584906,
"eval_PERSON_recall": 0.9473684210526315,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.30885857343673706,
"eval_overall_accuracy": 0.9654289372599232,
"eval_overall_f1": 0.8693181818181819,
"eval_overall_precision": 0.8360655737704918,
"eval_overall_recall": 0.9053254437869822,
"eval_runtime": 0.3216,
"eval_samples_per_second": 581.431,
"eval_steps_per_second": 9.328,
"step": 7314
},
{
"epoch": 70.0,
"grad_norm": 0.0254677664488554,
"learning_rate": 1.5e-05,
"loss": 0.001,
"step": 7420
},
{
"epoch": 70.0,
"eval_LOCATION_f1": 0.870748299319728,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8205128205128205,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.8091603053435115,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.726027397260274,
"eval_ORGANIZATION_recall": 0.9137931034482759,
"eval_PERSON_f1": 0.9102564102564101,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8875,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3140678107738495,
"eval_overall_accuracy": 0.9669654289372599,
"eval_overall_f1": 0.8723702664796634,
"eval_overall_precision": 0.8293333333333334,
"eval_overall_recall": 0.9201183431952663,
"eval_runtime": 0.339,
"eval_samples_per_second": 551.686,
"eval_steps_per_second": 8.851,
"step": 7420
},
{
"epoch": 71.0,
"grad_norm": 0.0020287446677684784,
"learning_rate": 1.45e-05,
"loss": 0.0006,
"step": 7526
},
{
"epoch": 71.0,
"eval_LOCATION_f1": 0.8648648648648648,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7777777777777778,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7205882352941176,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.9320388349514562,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.9171974522292994,
"eval_PERSON_recall": 0.9473684210526315,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2926411032676697,
"eval_overall_accuracy": 0.9682458386683739,
"eval_overall_f1": 0.876595744680851,
"eval_overall_precision": 0.8419618528610354,
"eval_overall_recall": 0.9142011834319527,
"eval_runtime": 0.3255,
"eval_samples_per_second": 574.564,
"eval_steps_per_second": 9.218,
"step": 7526
},
{
"epoch": 72.0,
"grad_norm": 0.0008131638751365244,
"learning_rate": 1.4000000000000001e-05,
"loss": 0.0003,
"step": 7632
},
{
"epoch": 72.0,
"eval_LOCATION_f1": 0.8590604026845639,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7999999999999999,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.746268656716418,
"eval_ORGANIZATION_recall": 0.8620689655172413,
"eval_PERSON_f1": 0.9255663430420712,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.910828025477707,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.316145658493042,
"eval_overall_accuracy": 0.9669654289372599,
"eval_overall_f1": 0.8753541076487252,
"eval_overall_precision": 0.8396739130434783,
"eval_overall_recall": 0.9142011834319527,
"eval_runtime": 0.3261,
"eval_samples_per_second": 573.373,
"eval_steps_per_second": 9.198,
"step": 7632
},
{
"epoch": 73.0,
"grad_norm": 0.000352115195710212,
"learning_rate": 1.3500000000000001e-05,
"loss": 0.0008,
"step": 7738
},
{
"epoch": 73.0,
"eval_LOCATION_f1": 0.8533333333333333,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7901234567901234,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7936507936507937,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7352941176470589,
"eval_ORGANIZATION_recall": 0.8620689655172413,
"eval_PERSON_f1": 0.9102564102564101,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8875,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.31928354501724243,
"eval_overall_accuracy": 0.9674775928297055,
"eval_overall_f1": 0.867605633802817,
"eval_overall_precision": 0.8279569892473119,
"eval_overall_recall": 0.9112426035502958,
"eval_runtime": 0.3197,
"eval_samples_per_second": 584.939,
"eval_steps_per_second": 9.384,
"step": 7738
},
{
"epoch": 74.0,
"grad_norm": 0.0021537726279348135,
"learning_rate": 1.3000000000000001e-05,
"loss": 0.0007,
"step": 7844
},
{
"epoch": 74.0,
"eval_LOCATION_f1": 0.8590604026845639,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7868852459016394,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.75,
"eval_ORGANIZATION_recall": 0.8275862068965517,
"eval_PERSON_f1": 0.9131832797427653,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8930817610062893,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3125959038734436,
"eval_overall_accuracy": 0.9661971830985916,
"eval_overall_f1": 0.8693181818181819,
"eval_overall_precision": 0.8360655737704918,
"eval_overall_recall": 0.9053254437869822,
"eval_runtime": 0.334,
"eval_samples_per_second": 559.859,
"eval_steps_per_second": 8.982,
"step": 7844
},
{
"epoch": 75.0,
"grad_norm": 0.0009629224659875035,
"learning_rate": 1.25e-05,
"loss": 0.0002,
"step": 7950
},
{
"epoch": 75.0,
"eval_LOCATION_f1": 0.8648648648648648,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7999999999999999,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7741935483870968,
"eval_ORGANIZATION_recall": 0.8275862068965517,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8860759493670886,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.31075483560562134,
"eval_overall_accuracy": 0.9656850192061459,
"eval_overall_f1": 0.8685714285714285,
"eval_overall_precision": 0.8397790055248618,
"eval_overall_recall": 0.8994082840236687,
"eval_runtime": 0.3244,
"eval_samples_per_second": 576.373,
"eval_steps_per_second": 9.247,
"step": 7950
},
{
"epoch": 76.0,
"grad_norm": 0.0005110618658363819,
"learning_rate": 1.2e-05,
"loss": 0.0003,
"step": 8056
},
{
"epoch": 76.0,
"eval_LOCATION_f1": 0.870748299319728,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8205128205128205,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.8160000000000001,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7611940298507462,
"eval_ORGANIZATION_recall": 0.8793103448275862,
"eval_PERSON_f1": 0.910828025477707,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8827160493827161,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3103707730770111,
"eval_overall_accuracy": 0.9667093469910372,
"eval_overall_f1": 0.8757062146892656,
"eval_overall_precision": 0.8378378378378378,
"eval_overall_recall": 0.9171597633136095,
"eval_runtime": 0.3262,
"eval_samples_per_second": 573.268,
"eval_steps_per_second": 9.197,
"step": 8056
},
{
"epoch": 77.0,
"grad_norm": 0.0007651924388483167,
"learning_rate": 1.1500000000000002e-05,
"loss": 0.0003,
"step": 8162
},
{
"epoch": 77.0,
"eval_LOCATION_f1": 0.8648648648648648,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.8188976377952756,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7536231884057971,
"eval_ORGANIZATION_recall": 0.896551724137931,
"eval_PERSON_f1": 0.9196141479099678,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.89937106918239,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3196667730808258,
"eval_overall_accuracy": 0.9682458386683739,
"eval_overall_f1": 0.8785310734463276,
"eval_overall_precision": 0.8405405405405405,
"eval_overall_recall": 0.9201183431952663,
"eval_runtime": 0.3219,
"eval_samples_per_second": 580.999,
"eval_steps_per_second": 9.321,
"step": 8162
},
{
"epoch": 78.0,
"grad_norm": 0.0005060500116087496,
"learning_rate": 1.1000000000000001e-05,
"loss": 0.0005,
"step": 8268
},
{
"epoch": 78.0,
"eval_LOCATION_f1": 0.8311688311688311,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7529411764705882,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7846153846153847,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7083333333333334,
"eval_ORGANIZATION_recall": 0.8793103448275862,
"eval_PERSON_f1": 0.9015873015873016,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8711656441717791,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3422912657260895,
"eval_overall_accuracy": 0.9636363636363636,
"eval_overall_f1": 0.8559556786703602,
"eval_overall_precision": 0.8046875,
"eval_overall_recall": 0.9142011834319527,
"eval_runtime": 0.3309,
"eval_samples_per_second": 565.193,
"eval_steps_per_second": 9.067,
"step": 8268
},
{
"epoch": 79.0,
"grad_norm": 0.0006566674564965069,
"learning_rate": 1.05e-05,
"loss": 0.0002,
"step": 8374
},
{
"epoch": 79.0,
"eval_LOCATION_f1": 0.870748299319728,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8205128205128205,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.8253968253968255,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7647058823529411,
"eval_ORGANIZATION_recall": 0.896551724137931,
"eval_PERSON_f1": 0.9073482428115016,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8819875776397516,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.33246731758117676,
"eval_overall_accuracy": 0.967989756722151,
"eval_overall_f1": 0.8757062146892656,
"eval_overall_precision": 0.8378378378378378,
"eval_overall_recall": 0.9171597633136095,
"eval_runtime": 0.3216,
"eval_samples_per_second": 581.551,
"eval_steps_per_second": 9.33,
"step": 8374
},
{
"epoch": 80.0,
"grad_norm": 0.00022042440832592547,
"learning_rate": 1e-05,
"loss": 0.0002,
"step": 8480
},
{
"epoch": 80.0,
"eval_LOCATION_f1": 0.8767123287671235,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7256637168141592,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7454545454545455,
"eval_ORGANIZATION_recall": 0.7068965517241379,
"eval_PERSON_f1": 0.9073482428115016,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8819875776397516,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.33535081148147583,
"eval_overall_accuracy": 0.9654289372599232,
"eval_overall_f1": 0.861671469740634,
"eval_overall_precision": 0.8398876404494382,
"eval_overall_recall": 0.8846153846153846,
"eval_runtime": 0.3346,
"eval_samples_per_second": 558.874,
"eval_steps_per_second": 8.966,
"step": 8480
},
{
"epoch": 81.0,
"grad_norm": 0.0007291326764971018,
"learning_rate": 9.5e-06,
"loss": 0.0004,
"step": 8586
},
{
"epoch": 81.0,
"eval_LOCATION_f1": 0.8456375838926175,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7875,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7741935483870968,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7272727272727273,
"eval_ORGANIZATION_recall": 0.8275862068965517,
"eval_PERSON_f1": 0.8974358974358975,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3405434489250183,
"eval_overall_accuracy": 0.9641485275288092,
"eval_overall_f1": 0.8559322033898306,
"eval_overall_precision": 0.8189189189189189,
"eval_overall_recall": 0.8964497041420119,
"eval_runtime": 0.3228,
"eval_samples_per_second": 579.316,
"eval_steps_per_second": 9.294,
"step": 8586
},
{
"epoch": 82.0,
"grad_norm": 0.00018406176241114736,
"learning_rate": 9e-06,
"loss": 0.0002,
"step": 8692
},
{
"epoch": 82.0,
"eval_LOCATION_f1": 0.8767123287671235,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7563025210084033,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7377049180327869,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.9102564102564101,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8875,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.33905231952667236,
"eval_overall_accuracy": 0.9664532650448143,
"eval_overall_f1": 0.8669527896995709,
"eval_overall_precision": 0.8393351800554016,
"eval_overall_recall": 0.8964497041420119,
"eval_runtime": 0.3217,
"eval_samples_per_second": 581.317,
"eval_steps_per_second": 9.326,
"step": 8692
},
{
"epoch": 83.0,
"grad_norm": 0.0005490140756592155,
"learning_rate": 8.500000000000002e-06,
"loss": 0.0003,
"step": 8798
},
{
"epoch": 83.0,
"eval_LOCATION_f1": 0.8648648648648648,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7479674796747967,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7076923076923077,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.9038461538461539,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.88125,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.348821759223938,
"eval_overall_accuracy": 0.9636363636363636,
"eval_overall_f1": 0.8595744680851063,
"eval_overall_precision": 0.8256130790190735,
"eval_overall_recall": 0.8964497041420119,
"eval_runtime": 0.3214,
"eval_samples_per_second": 581.755,
"eval_steps_per_second": 9.333,
"step": 8798
},
{
"epoch": 84.0,
"grad_norm": 0.0003215703763999045,
"learning_rate": 8.000000000000001e-06,
"loss": 0.0002,
"step": 8904
},
{
"epoch": 84.0,
"eval_LOCATION_f1": 0.870748299319728,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8205128205128205,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7563025210084033,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7377049180327869,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.9137380191693291,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8881987577639752,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.343229740858078,
"eval_overall_accuracy": 0.9651728553137003,
"eval_overall_f1": 0.8673323823109843,
"eval_overall_precision": 0.837465564738292,
"eval_overall_recall": 0.8994082840236687,
"eval_runtime": 0.3342,
"eval_samples_per_second": 559.576,
"eval_steps_per_second": 8.977,
"step": 8904
},
{
"epoch": 85.0,
"grad_norm": 0.00015092955436557531,
"learning_rate": 7.5e-06,
"loss": 0.0003,
"step": 9010
},
{
"epoch": 85.0,
"eval_LOCATION_f1": 0.8590604026845639,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7804878048780489,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7384615384615385,
"eval_ORGANIZATION_recall": 0.8275862068965517,
"eval_PERSON_f1": 0.9166666666666667,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.89375,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.34420961141586304,
"eval_overall_accuracy": 0.9654289372599232,
"eval_overall_f1": 0.8696883852691217,
"eval_overall_precision": 0.8342391304347826,
"eval_overall_recall": 0.908284023668639,
"eval_runtime": 0.3181,
"eval_samples_per_second": 587.95,
"eval_steps_per_second": 9.432,
"step": 9010
},
{
"epoch": 86.0,
"grad_norm": 0.0005039689131081104,
"learning_rate": 7.000000000000001e-06,
"loss": 0.0005,
"step": 9116
},
{
"epoch": 86.0,
"eval_LOCATION_f1": 0.8648648648648648,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7903225806451614,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7424242424242424,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.9196141479099678,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.89937106918239,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3417365849018097,
"eval_overall_accuracy": 0.9661971830985916,
"eval_overall_f1": 0.873758865248227,
"eval_overall_precision": 0.8392370572207084,
"eval_overall_recall": 0.9112426035502958,
"eval_runtime": 0.3234,
"eval_samples_per_second": 578.156,
"eval_steps_per_second": 9.275,
"step": 9116
},
{
"epoch": 87.0,
"grad_norm": 0.00023389511625282466,
"learning_rate": 6.5000000000000004e-06,
"loss": 0.0002,
"step": 9222
},
{
"epoch": 87.0,
"eval_LOCATION_f1": 0.8648648648648648,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7777777777777778,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7205882352941176,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.9166666666666667,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.89375,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3444933593273163,
"eval_overall_accuracy": 0.9654289372599232,
"eval_overall_f1": 0.8688293370944994,
"eval_overall_precision": 0.8301886792452831,
"eval_overall_recall": 0.9112426035502958,
"eval_runtime": 0.319,
"eval_samples_per_second": 586.225,
"eval_steps_per_second": 9.405,
"step": 9222
},
{
"epoch": 88.0,
"grad_norm": 0.0009348023450002074,
"learning_rate": 6e-06,
"loss": 0.0002,
"step": 9328
},
{
"epoch": 88.0,
"eval_LOCATION_f1": 0.8648648648648648,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7777777777777778,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7205882352941176,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.9131832797427653,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8930817610062893,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8666666666666666,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3449549674987793,
"eval_overall_accuracy": 0.9651728553137003,
"eval_overall_f1": 0.867231638418079,
"eval_overall_precision": 0.8297297297297297,
"eval_overall_recall": 0.908284023668639,
"eval_runtime": 0.3216,
"eval_samples_per_second": 581.43,
"eval_steps_per_second": 9.328,
"step": 9328
},
{
"epoch": 89.0,
"grad_norm": 0.10062725096940994,
"learning_rate": 5.500000000000001e-06,
"loss": 0.0002,
"step": 9434
},
{
"epoch": 89.0,
"eval_LOCATION_f1": 0.8648648648648648,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7777777777777778,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7205882352941176,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.9196141479099678,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.89937106918239,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3450436592102051,
"eval_overall_accuracy": 0.9659411011523688,
"eval_overall_f1": 0.8712871287128714,
"eval_overall_precision": 0.8346883468834688,
"eval_overall_recall": 0.9112426035502958,
"eval_runtime": 0.3226,
"eval_samples_per_second": 579.728,
"eval_steps_per_second": 9.3,
"step": 9434
},
{
"epoch": 90.0,
"grad_norm": 0.00016394459817092866,
"learning_rate": 5e-06,
"loss": 0.0002,
"step": 9540
},
{
"epoch": 90.0,
"eval_LOCATION_f1": 0.8648648648648648,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7777777777777778,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7205882352941176,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.9196141479099678,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.89937106918239,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3440031111240387,
"eval_overall_accuracy": 0.9661971830985916,
"eval_overall_f1": 0.8712871287128714,
"eval_overall_precision": 0.8346883468834688,
"eval_overall_recall": 0.9112426035502958,
"eval_runtime": 0.3218,
"eval_samples_per_second": 581.062,
"eval_steps_per_second": 9.322,
"step": 9540
},
{
"epoch": 91.0,
"grad_norm": 0.00035388587275519967,
"learning_rate": 4.5e-06,
"loss": 0.0002,
"step": 9646
},
{
"epoch": 91.0,
"eval_LOCATION_f1": 0.8648648648648648,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7777777777777778,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7205882352941176,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.9196141479099678,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.89937106918239,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3439503610134125,
"eval_overall_accuracy": 0.9661971830985916,
"eval_overall_f1": 0.8712871287128714,
"eval_overall_precision": 0.8346883468834688,
"eval_overall_recall": 0.9112426035502958,
"eval_runtime": 0.3221,
"eval_samples_per_second": 580.542,
"eval_steps_per_second": 9.314,
"step": 9646
},
{
"epoch": 92.0,
"grad_norm": 0.0005183388711884618,
"learning_rate": 4.000000000000001e-06,
"loss": 0.0002,
"step": 9752
},
{
"epoch": 92.0,
"eval_LOCATION_f1": 0.8648648648648648,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7777777777777778,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7205882352941176,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.9196141479099678,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.89937106918239,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.34474003314971924,
"eval_overall_accuracy": 0.9661971830985916,
"eval_overall_f1": 0.8712871287128714,
"eval_overall_precision": 0.8346883468834688,
"eval_overall_recall": 0.9112426035502958,
"eval_runtime": 0.3227,
"eval_samples_per_second": 579.512,
"eval_steps_per_second": 9.297,
"step": 9752
},
{
"epoch": 93.0,
"grad_norm": 0.00015504320617765188,
"learning_rate": 3.5000000000000004e-06,
"loss": 0.0004,
"step": 9858
},
{
"epoch": 93.0,
"eval_LOCATION_f1": 0.8648648648648648,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.765625,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.9196141479099678,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.89937106918239,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.34853395819664,
"eval_overall_accuracy": 0.9656850192061459,
"eval_overall_f1": 0.8688293370944994,
"eval_overall_precision": 0.8301886792452831,
"eval_overall_recall": 0.9112426035502958,
"eval_runtime": 0.3252,
"eval_samples_per_second": 575.06,
"eval_steps_per_second": 9.226,
"step": 9858
},
{
"epoch": 94.0,
"grad_norm": 0.0016579556977376342,
"learning_rate": 3e-06,
"loss": 0.0002,
"step": 9964
},
{
"epoch": 94.0,
"eval_LOCATION_f1": 0.870748299319728,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8205128205128205,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7903225806451614,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7424242424242424,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.9225806451612903,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.9050632911392406,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.34736061096191406,
"eval_overall_accuracy": 0.9672215108834827,
"eval_overall_f1": 0.8762446657183499,
"eval_overall_precision": 0.8438356164383561,
"eval_overall_recall": 0.9112426035502958,
"eval_runtime": 0.324,
"eval_samples_per_second": 577.077,
"eval_steps_per_second": 9.258,
"step": 9964
},
{
"epoch": 95.0,
"grad_norm": 0.0002204200136475265,
"learning_rate": 2.5e-06,
"loss": 0.0002,
"step": 10070
},
{
"epoch": 95.0,
"eval_LOCATION_f1": 0.870748299319728,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8205128205128205,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7903225806451614,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7424242424242424,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.9225806451612903,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.9050632911392406,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3477398753166199,
"eval_overall_accuracy": 0.9669654289372599,
"eval_overall_f1": 0.8762446657183499,
"eval_overall_precision": 0.8438356164383561,
"eval_overall_recall": 0.9112426035502958,
"eval_runtime": 0.3352,
"eval_samples_per_second": 557.803,
"eval_steps_per_second": 8.949,
"step": 10070
},
{
"epoch": 96.0,
"grad_norm": 0.0003840687859337777,
"learning_rate": 2.0000000000000003e-06,
"loss": 0.0002,
"step": 10176
},
{
"epoch": 96.0,
"eval_LOCATION_f1": 0.870748299319728,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8205128205128205,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7903225806451614,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7424242424242424,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.9196141479099678,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.89937106918239,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.34747499227523804,
"eval_overall_accuracy": 0.9669654289372599,
"eval_overall_f1": 0.875,
"eval_overall_precision": 0.8415300546448088,
"eval_overall_recall": 0.9112426035502958,
"eval_runtime": 0.3248,
"eval_samples_per_second": 575.753,
"eval_steps_per_second": 9.237,
"step": 10176
},
{
"epoch": 97.0,
"grad_norm": 0.0001158128070528619,
"learning_rate": 1.5e-06,
"loss": 0.0002,
"step": 10282
},
{
"epoch": 97.0,
"eval_LOCATION_f1": 0.870748299319728,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8205128205128205,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7903225806451614,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7424242424242424,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.9196141479099678,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.89937106918239,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.34782785177230835,
"eval_overall_accuracy": 0.9669654289372599,
"eval_overall_f1": 0.875,
"eval_overall_precision": 0.8415300546448088,
"eval_overall_recall": 0.9112426035502958,
"eval_runtime": 0.3347,
"eval_samples_per_second": 558.788,
"eval_steps_per_second": 8.965,
"step": 10282
},
{
"epoch": 98.0,
"grad_norm": 0.0001685286551946774,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0001,
"step": 10388
},
{
"epoch": 98.0,
"eval_LOCATION_f1": 0.870748299319728,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8205128205128205,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7903225806451614,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7424242424242424,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.9196141479099678,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.89937106918239,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3480530083179474,
"eval_overall_accuracy": 0.9669654289372599,
"eval_overall_f1": 0.875,
"eval_overall_precision": 0.8415300546448088,
"eval_overall_recall": 0.9112426035502958,
"eval_runtime": 0.3236,
"eval_samples_per_second": 577.794,
"eval_steps_per_second": 9.269,
"step": 10388
},
{
"epoch": 99.0,
"grad_norm": 0.0004627603921107948,
"learning_rate": 5.000000000000001e-07,
"loss": 0.0003,
"step": 10494
},
{
"epoch": 99.0,
"eval_LOCATION_f1": 0.870748299319728,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8205128205128205,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7903225806451614,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7424242424242424,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.9196141479099678,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.89937106918239,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.3480047881603241,
"eval_overall_accuracy": 0.9669654289372599,
"eval_overall_f1": 0.875,
"eval_overall_precision": 0.8415300546448088,
"eval_overall_recall": 0.9112426035502958,
"eval_runtime": 0.33,
"eval_samples_per_second": 566.586,
"eval_steps_per_second": 9.09,
"step": 10494
},
{
"epoch": 100.0,
"grad_norm": 0.00016238813987001777,
"learning_rate": 0.0,
"loss": 0.0002,
"step": 10600
},
{
"epoch": 100.0,
"eval_LOCATION_f1": 0.870748299319728,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8205128205128205,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7903225806451614,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.7424242424242424,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.9225806451612903,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.9050632911392406,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.34784960746765137,
"eval_overall_accuracy": 0.9669654289372599,
"eval_overall_f1": 0.8762446657183499,
"eval_overall_precision": 0.8438356164383561,
"eval_overall_recall": 0.9112426035502958,
"eval_runtime": 0.3263,
"eval_samples_per_second": 573.017,
"eval_steps_per_second": 9.193,
"step": 10600
},
{
"epoch": 100.0,
"step": 10600,
"total_flos": 4488439619319522.0,
"train_loss": 0.00870069551422208,
"train_runtime": 967.5082,
"train_samples_per_second": 174.365,
"train_steps_per_second": 10.956
}
],
"logging_steps": 500,
"max_steps": 10600,
"num_input_tokens_seen": 0,
"num_train_epochs": 100,
"save_steps": 500,
"total_flos": 4488439619319522.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}