nerugm-pt-pl20-1 / trainer_state.json
apwic's picture
End of training
3db1454 verified
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 100.0,
"eval_steps": 500,
"global_step": 10600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 1.0272084474563599,
"learning_rate": 4.9500000000000004e-05,
"loss": 0.9918,
"step": 106
},
{
"epoch": 1.0,
"eval_LOCATION_f1": 0.0,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.0,
"eval_LOCATION_recall": 0.0,
"eval_ORGANIZATION_f1": 0.0,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.0,
"eval_ORGANIZATION_recall": 0.0,
"eval_PERSON_f1": 0.047058823529411764,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.23529411764705882,
"eval_PERSON_recall": 0.026143790849673203,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.0588235294117647,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.3333333333333333,
"eval_TIME_recall": 0.03225806451612903,
"eval_loss": 0.5814589858055115,
"eval_overall_accuracy": 0.8387416398315581,
"eval_overall_f1": 0.026315789473684213,
"eval_overall_precision": 0.14705882352941177,
"eval_overall_recall": 0.014450867052023121,
"eval_runtime": 0.3818,
"eval_samples_per_second": 489.811,
"eval_steps_per_second": 7.858,
"step": 106
},
{
"epoch": 2.0,
"grad_norm": 1.5510079860687256,
"learning_rate": 4.9e-05,
"loss": 0.5136,
"step": 212
},
{
"epoch": 2.0,
"eval_LOCATION_f1": 0.07228915662650602,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.21428571428571427,
"eval_LOCATION_recall": 0.043478260869565216,
"eval_ORGANIZATION_f1": 0.02150537634408602,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.03125,
"eval_ORGANIZATION_recall": 0.01639344262295082,
"eval_PERSON_f1": 0.5854922279792746,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.48497854077253216,
"eval_PERSON_recall": 0.738562091503268,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.4776119402985074,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.4444444444444444,
"eval_TIME_recall": 0.5161290322580645,
"eval_loss": 0.3840640187263489,
"eval_overall_accuracy": 0.8872925439682933,
"eval_overall_f1": 0.39642324888226527,
"eval_overall_precision": 0.40923076923076923,
"eval_overall_recall": 0.38439306358381503,
"eval_runtime": 0.3813,
"eval_samples_per_second": 490.398,
"eval_steps_per_second": 7.867,
"step": 212
},
{
"epoch": 3.0,
"grad_norm": 1.2181504964828491,
"learning_rate": 4.85e-05,
"loss": 0.3245,
"step": 318
},
{
"epoch": 3.0,
"eval_LOCATION_f1": 0.6335403726708074,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.5543478260869565,
"eval_LOCATION_recall": 0.7391304347826086,
"eval_ORGANIZATION_f1": 0.4903225806451613,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.40425531914893614,
"eval_ORGANIZATION_recall": 0.6229508196721312,
"eval_PERSON_f1": 0.8121212121212121,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.7570621468926554,
"eval_PERSON_recall": 0.8758169934640523,
"eval_QUANTITY_f1": 0.5128205128205128,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.43478260869565216,
"eval_QUANTITY_recall": 0.625,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.22633680701255798,
"eval_overall_accuracy": 0.9291553133514986,
"eval_overall_f1": 0.6852791878172589,
"eval_overall_precision": 0.6108597285067874,
"eval_overall_recall": 0.7803468208092486,
"eval_runtime": 0.3827,
"eval_samples_per_second": 488.604,
"eval_steps_per_second": 7.839,
"step": 318
},
{
"epoch": 4.0,
"grad_norm": 1.4188401699066162,
"learning_rate": 4.8e-05,
"loss": 0.2176,
"step": 424
},
{
"epoch": 4.0,
"eval_LOCATION_f1": 0.6744186046511628,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.5631067961165048,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.5333333333333332,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.4864864864864865,
"eval_ORGANIZATION_recall": 0.5901639344262295,
"eval_PERSON_f1": 0.8338368580060423,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.7752808988764045,
"eval_PERSON_recall": 0.9019607843137255,
"eval_QUANTITY_f1": 0.46153846153846156,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.3559322033898305,
"eval_QUANTITY_recall": 0.65625,
"eval_TIME_f1": 0.6578947368421053,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.5555555555555556,
"eval_TIME_recall": 0.8064516129032258,
"eval_loss": 0.19828897714614868,
"eval_overall_accuracy": 0.9298984394352242,
"eval_overall_f1": 0.6906832298136646,
"eval_overall_precision": 0.6056644880174292,
"eval_overall_recall": 0.8034682080924855,
"eval_runtime": 0.3817,
"eval_samples_per_second": 489.958,
"eval_steps_per_second": 7.86,
"step": 424
},
{
"epoch": 5.0,
"grad_norm": 0.8591908812522888,
"learning_rate": 4.75e-05,
"loss": 0.1812,
"step": 530
},
{
"epoch": 5.0,
"eval_LOCATION_f1": 0.7123287671232876,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.6753246753246753,
"eval_LOCATION_recall": 0.7536231884057971,
"eval_ORGANIZATION_f1": 0.625,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5421686746987951,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.8650306748466258,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.815028901734104,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7222222222222223,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.65,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.14980928599834442,
"eval_overall_accuracy": 0.9497151350012385,
"eval_overall_f1": 0.7733333333333333,
"eval_overall_precision": 0.7178217821782178,
"eval_overall_recall": 0.838150289017341,
"eval_runtime": 0.3817,
"eval_samples_per_second": 489.861,
"eval_steps_per_second": 7.859,
"step": 530
},
{
"epoch": 6.0,
"grad_norm": 0.4265460968017578,
"learning_rate": 4.7e-05,
"loss": 0.1571,
"step": 636
},
{
"epoch": 6.0,
"eval_LOCATION_f1": 0.7125,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.6263736263736264,
"eval_LOCATION_recall": 0.8260869565217391,
"eval_ORGANIZATION_f1": 0.620253164556962,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5051546391752577,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.8847352024922119,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8452380952380952,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.6756756756756757,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.5952380952380952,
"eval_QUANTITY_recall": 0.78125,
"eval_TIME_f1": 0.7536231884057972,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.6842105263157895,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.15143448114395142,
"eval_overall_accuracy": 0.9464949219717612,
"eval_overall_f1": 0.7647058823529412,
"eval_overall_precision": 0.6857798165137615,
"eval_overall_recall": 0.8641618497109826,
"eval_runtime": 0.381,
"eval_samples_per_second": 490.81,
"eval_steps_per_second": 7.874,
"step": 636
},
{
"epoch": 7.0,
"grad_norm": 0.6821984648704529,
"learning_rate": 4.6500000000000005e-05,
"loss": 0.1435,
"step": 742
},
{
"epoch": 7.0,
"eval_LOCATION_f1": 0.7388535031847134,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.6590909090909091,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.6712328767123288,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5764705882352941,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.8711656441717791,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8208092485549133,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.641025641025641,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.5434782608695652,
"eval_QUANTITY_recall": 0.78125,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.15106207132339478,
"eval_overall_accuracy": 0.9497151350012385,
"eval_overall_f1": 0.7782101167315175,
"eval_overall_precision": 0.7058823529411765,
"eval_overall_recall": 0.8670520231213873,
"eval_runtime": 0.3811,
"eval_samples_per_second": 490.727,
"eval_steps_per_second": 7.873,
"step": 742
},
{
"epoch": 8.0,
"grad_norm": 0.5688347220420837,
"learning_rate": 4.600000000000001e-05,
"loss": 0.1354,
"step": 848
},
{
"epoch": 8.0,
"eval_LOCATION_f1": 0.778523489932886,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.725,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.6363636363636364,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5268817204301075,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.8757763975155279,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.834319526627219,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7123287671232876,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6341463414634146,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.7027027027027026,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.6046511627906976,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.14667640626430511,
"eval_overall_accuracy": 0.9504582610849641,
"eval_overall_f1": 0.7772020725388601,
"eval_overall_precision": 0.704225352112676,
"eval_overall_recall": 0.8670520231213873,
"eval_runtime": 0.3804,
"eval_samples_per_second": 491.557,
"eval_steps_per_second": 7.886,
"step": 848
},
{
"epoch": 9.0,
"grad_norm": 1.076498031616211,
"learning_rate": 4.55e-05,
"loss": 0.1286,
"step": 954
},
{
"epoch": 9.0,
"eval_LOCATION_f1": 0.7295597484276729,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.6444444444444445,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.6716417910447762,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6164383561643836,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.89375,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8562874251497006,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.7222222222222223,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.65,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.7123287671232876,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.6190476190476191,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.13916395604610443,
"eval_overall_accuracy": 0.9546693088927422,
"eval_overall_f1": 0.7862796833773087,
"eval_overall_precision": 0.7233009708737864,
"eval_overall_recall": 0.861271676300578,
"eval_runtime": 0.383,
"eval_samples_per_second": 488.209,
"eval_steps_per_second": 7.832,
"step": 954
},
{
"epoch": 10.0,
"grad_norm": 0.7342737317085266,
"learning_rate": 4.5e-05,
"loss": 0.1192,
"step": 1060
},
{
"epoch": 10.0,
"eval_LOCATION_f1": 0.7567567567567568,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7088607594936709,
"eval_LOCATION_recall": 0.8115942028985508,
"eval_ORGANIZATION_f1": 0.6811594202898551,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6103896103896104,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.8785046728971961,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8392857142857143,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.742857142857143,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6842105263157895,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.7936507936507936,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8064516129032258,
"eval_loss": 0.12648716568946838,
"eval_overall_accuracy": 0.9576418132276443,
"eval_overall_f1": 0.7972972972972973,
"eval_overall_precision": 0.748730964467005,
"eval_overall_recall": 0.8526011560693642,
"eval_runtime": 0.3808,
"eval_samples_per_second": 491.1,
"eval_steps_per_second": 7.879,
"step": 1060
},
{
"epoch": 11.0,
"grad_norm": 0.3874886929988861,
"learning_rate": 4.4500000000000004e-05,
"loss": 0.111,
"step": 1166
},
{
"epoch": 11.0,
"eval_LOCATION_f1": 0.75,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.6867469879518072,
"eval_LOCATION_recall": 0.8260869565217391,
"eval_ORGANIZATION_f1": 0.6666666666666667,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6081081081081081,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.8952380952380952,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8703703703703703,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7222222222222223,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.65,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8059701492537312,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.12904293835163116,
"eval_overall_accuracy": 0.9583849393113698,
"eval_overall_f1": 0.7989203778677463,
"eval_overall_precision": 0.7493670886075949,
"eval_overall_recall": 0.8554913294797688,
"eval_runtime": 0.3855,
"eval_samples_per_second": 485.047,
"eval_steps_per_second": 7.782,
"step": 1166
},
{
"epoch": 12.0,
"grad_norm": 2.021855354309082,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.1107,
"step": 1272
},
{
"epoch": 12.0,
"eval_LOCATION_f1": 0.7945205479452054,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7532467532467533,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.6715328467153285,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6052631578947368,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.8706624605678233,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.9019607843137255,
"eval_QUANTITY_f1": 0.7123287671232876,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6341463414634146,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8064516129032258,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8064516129032258,
"eval_loss": 0.13058660924434662,
"eval_overall_accuracy": 0.9564032697547684,
"eval_overall_f1": 0.7972789115646259,
"eval_overall_precision": 0.7532133676092545,
"eval_overall_recall": 0.846820809248555,
"eval_runtime": 0.3807,
"eval_samples_per_second": 491.184,
"eval_steps_per_second": 7.88,
"step": 1272
},
{
"epoch": 13.0,
"grad_norm": 0.5758412480354309,
"learning_rate": 4.35e-05,
"loss": 0.102,
"step": 1378
},
{
"epoch": 13.0,
"eval_LOCATION_f1": 0.7619047619047619,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.717948717948718,
"eval_LOCATION_recall": 0.8115942028985508,
"eval_ORGANIZATION_f1": 0.7210884353741497,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6162790697674418,
"eval_ORGANIZATION_recall": 0.8688524590163934,
"eval_PERSON_f1": 0.88125,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.844311377245509,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7246376811594203,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6756756756756757,
"eval_QUANTITY_recall": 0.78125,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.1381181925535202,
"eval_overall_accuracy": 0.9576418132276443,
"eval_overall_f1": 0.8048128342245989,
"eval_overall_precision": 0.7487562189054726,
"eval_overall_recall": 0.869942196531792,
"eval_runtime": 0.3792,
"eval_samples_per_second": 493.132,
"eval_steps_per_second": 7.911,
"step": 1378
},
{
"epoch": 14.0,
"grad_norm": 1.8765839338302612,
"learning_rate": 4.3e-05,
"loss": 0.0995,
"step": 1484
},
{
"epoch": 14.0,
"eval_LOCATION_f1": 0.8055555555555556,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7733333333333333,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.7591240875912408,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6842105263157895,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.89937106918239,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8666666666666667,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.7605633802816902,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.7605633802816901,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.675,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1333017796278,
"eval_overall_accuracy": 0.9598711914788209,
"eval_overall_f1": 0.8286099865047234,
"eval_overall_precision": 0.7772151898734178,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3856,
"eval_samples_per_second": 484.98,
"eval_steps_per_second": 7.78,
"step": 1484
},
{
"epoch": 15.0,
"grad_norm": 0.3261714577674866,
"learning_rate": 4.25e-05,
"loss": 0.099,
"step": 1590
},
{
"epoch": 15.0,
"eval_LOCATION_f1": 0.7866666666666667,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6911764705882353,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6266666666666667,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.8980891719745223,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8757763975155279,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.7605633802816902,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8484848484848486,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.13288669288158417,
"eval_overall_accuracy": 0.9598711914788209,
"eval_overall_f1": 0.8195386702849389,
"eval_overall_precision": 0.7723785166240409,
"eval_overall_recall": 0.8728323699421965,
"eval_runtime": 0.3826,
"eval_samples_per_second": 488.811,
"eval_steps_per_second": 7.842,
"step": 1590
},
{
"epoch": 16.0,
"grad_norm": 0.4830576777458191,
"learning_rate": 4.2e-05,
"loss": 0.0931,
"step": 1696
},
{
"epoch": 16.0,
"eval_LOCATION_f1": 0.8082191780821918,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7662337662337663,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6944444444444445,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6024096385542169,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.9056603773584905,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8727272727272727,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.7605633802816902,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8253968253968254,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.13907834887504578,
"eval_overall_accuracy": 0.9596234827842457,
"eval_overall_f1": 0.8247978436657681,
"eval_overall_precision": 0.7727272727272727,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.3853,
"eval_samples_per_second": 485.328,
"eval_steps_per_second": 7.786,
"step": 1696
},
{
"epoch": 17.0,
"grad_norm": 0.4928819239139557,
"learning_rate": 4.15e-05,
"loss": 0.0906,
"step": 1802
},
{
"epoch": 17.0,
"eval_LOCATION_f1": 0.7972972972972974,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7468354430379747,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.620253164556962,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.8987341772151898,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8711656441717791,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.7222222222222223,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.65,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8181818181818182,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7714285714285715,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.12818662822246552,
"eval_overall_accuracy": 0.9598711914788209,
"eval_overall_f1": 0.8167115902964959,
"eval_overall_precision": 0.7651515151515151,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.3827,
"eval_samples_per_second": 488.583,
"eval_steps_per_second": 7.838,
"step": 1802
},
{
"epoch": 18.0,
"grad_norm": 0.7172600030899048,
"learning_rate": 4.1e-05,
"loss": 0.0856,
"step": 1908
},
{
"epoch": 18.0,
"eval_LOCATION_f1": 0.8055555555555556,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7733333333333333,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.6716417910447762,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6164383561643836,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.8987341772151898,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8711656441717791,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.7222222222222223,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.65,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8059701492537312,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.13049036264419556,
"eval_overall_accuracy": 0.9596234827842457,
"eval_overall_f1": 0.8130968622100955,
"eval_overall_precision": 0.7700258397932817,
"eval_overall_recall": 0.861271676300578,
"eval_runtime": 0.3827,
"eval_samples_per_second": 488.581,
"eval_steps_per_second": 7.838,
"step": 1908
},
{
"epoch": 19.0,
"grad_norm": 0.9027535915374756,
"learning_rate": 4.05e-05,
"loss": 0.0862,
"step": 2014
},
{
"epoch": 19.0,
"eval_LOCATION_f1": 0.7916666666666667,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.76,
"eval_LOCATION_recall": 0.8260869565217391,
"eval_ORGANIZATION_f1": 0.6814814814814815,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6216216216216216,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9113924050632911,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8834355828220859,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.742857142857143,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6842105263157895,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8615384615384616,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8235294117647058,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.12171386927366257,
"eval_overall_accuracy": 0.964082239286599,
"eval_overall_f1": 0.8246575342465753,
"eval_overall_precision": 0.7838541666666666,
"eval_overall_recall": 0.869942196531792,
"eval_runtime": 0.3824,
"eval_samples_per_second": 489.029,
"eval_steps_per_second": 7.845,
"step": 2014
},
{
"epoch": 20.0,
"grad_norm": 0.6771568059921265,
"learning_rate": 4e-05,
"loss": 0.0814,
"step": 2120
},
{
"epoch": 20.0,
"eval_LOCATION_f1": 0.8137931034482757,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7763157894736842,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.697986577181208,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5909090909090909,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.9056603773584905,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8727272727272727,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.742857142857143,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6842105263157895,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1427459567785263,
"eval_overall_accuracy": 0.958632648005945,
"eval_overall_f1": 0.8246318607764391,
"eval_overall_precision": 0.7680798004987531,
"eval_overall_recall": 0.8901734104046243,
"eval_runtime": 0.3808,
"eval_samples_per_second": 491.039,
"eval_steps_per_second": 7.878,
"step": 2120
},
{
"epoch": 21.0,
"grad_norm": 0.6687225699424744,
"learning_rate": 3.9500000000000005e-05,
"loss": 0.0771,
"step": 2226
},
{
"epoch": 21.0,
"eval_LOCATION_f1": 0.802721088435374,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7564102564102564,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6944444444444445,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6024096385542169,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.8902821316614421,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8554216867469879,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.7123287671232876,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6341463414634146,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.782608695652174,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7105263157894737,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.14838886260986328,
"eval_overall_accuracy": 0.9564032697547684,
"eval_overall_f1": 0.8085106382978724,
"eval_overall_precision": 0.7487684729064039,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3884,
"eval_samples_per_second": 481.488,
"eval_steps_per_second": 7.724,
"step": 2226
},
{
"epoch": 22.0,
"grad_norm": 0.5799835324287415,
"learning_rate": 3.9000000000000006e-05,
"loss": 0.0803,
"step": 2332
},
{
"epoch": 22.0,
"eval_LOCATION_f1": 0.8137931034482757,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7763157894736842,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6923076923076923,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5684210526315789,
"eval_ORGANIZATION_recall": 0.8852459016393442,
"eval_PERSON_f1": 0.9085173501577287,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8780487804878049,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.7323943661971831,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1494436264038086,
"eval_overall_accuracy": 0.9583849393113698,
"eval_overall_f1": 0.8233731739707836,
"eval_overall_precision": 0.7616707616707616,
"eval_overall_recall": 0.8959537572254336,
"eval_runtime": 0.3837,
"eval_samples_per_second": 487.419,
"eval_steps_per_second": 7.82,
"step": 2332
},
{
"epoch": 23.0,
"grad_norm": 0.6878646612167358,
"learning_rate": 3.85e-05,
"loss": 0.0775,
"step": 2438
},
{
"epoch": 23.0,
"eval_LOCATION_f1": 0.786206896551724,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8260869565217391,
"eval_ORGANIZATION_f1": 0.7007299270072993,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.631578947368421,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9015873015873016,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8765432098765432,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.7323943661971831,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.1338999718427658,
"eval_overall_accuracy": 0.9621005697299975,
"eval_overall_f1": 0.8169398907103824,
"eval_overall_precision": 0.7746113989637305,
"eval_overall_recall": 0.8641618497109826,
"eval_runtime": 0.386,
"eval_samples_per_second": 484.497,
"eval_steps_per_second": 7.773,
"step": 2438
},
{
"epoch": 24.0,
"grad_norm": 2.1059324741363525,
"learning_rate": 3.8e-05,
"loss": 0.0723,
"step": 2544
},
{
"epoch": 24.0,
"eval_LOCATION_f1": 0.8194444444444444,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7866666666666666,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6766917293233082,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.896551724137931,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8614457831325302,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.7123287671232876,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6341463414634146,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8405797101449276,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7631578947368421,
"eval_TIME_recall": 0.9354838709677419,
"eval_loss": 0.13374261558055878,
"eval_overall_accuracy": 0.9603666088679713,
"eval_overall_f1": 0.8184281842818428,
"eval_overall_precision": 0.7704081632653061,
"eval_overall_recall": 0.8728323699421965,
"eval_runtime": 0.3878,
"eval_samples_per_second": 482.16,
"eval_steps_per_second": 7.735,
"step": 2544
},
{
"epoch": 25.0,
"grad_norm": 0.4981442391872406,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.0729,
"step": 2650
},
{
"epoch": 25.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7631578947368421,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.7034482758620689,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6071428571428571,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.8987341772151898,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8711656441717791,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.7123287671232876,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6341463414634146,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.823529411764706,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7567567567567568,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.13796736299991608,
"eval_overall_accuracy": 0.9616051523408472,
"eval_overall_f1": 0.8165997322623829,
"eval_overall_precision": 0.7605985037406484,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.3871,
"eval_samples_per_second": 483.14,
"eval_steps_per_second": 7.751,
"step": 2650
},
{
"epoch": 26.0,
"grad_norm": 0.8632038235664368,
"learning_rate": 3.7e-05,
"loss": 0.0694,
"step": 2756
},
{
"epoch": 26.0,
"eval_LOCATION_f1": 0.8194444444444444,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7866666666666666,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6917293233082706,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6388888888888888,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9056603773584905,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8727272727272727,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.7222222222222223,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.65,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8615384615384616,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8235294117647058,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.1314733773469925,
"eval_overall_accuracy": 0.9633391132028735,
"eval_overall_f1": 0.8278688524590163,
"eval_overall_precision": 0.7849740932642487,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.3825,
"eval_samples_per_second": 488.948,
"eval_steps_per_second": 7.844,
"step": 2756
},
{
"epoch": 27.0,
"grad_norm": 0.6470693945884705,
"learning_rate": 3.65e-05,
"loss": 0.063,
"step": 2862
},
{
"epoch": 27.0,
"eval_LOCATION_f1": 0.8194444444444444,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7866666666666666,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.620253164556962,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.896551724137931,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8614457831325302,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.7222222222222223,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.65,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.717948717948718,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.13855965435504913,
"eval_overall_accuracy": 0.9603666088679713,
"eval_overall_f1": 0.8187919463087249,
"eval_overall_precision": 0.7644110275689223,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.3834,
"eval_samples_per_second": 487.795,
"eval_steps_per_second": 7.826,
"step": 2862
},
{
"epoch": 28.0,
"grad_norm": 1.1696481704711914,
"learning_rate": 3.6e-05,
"loss": 0.0662,
"step": 2968
},
{
"epoch": 28.0,
"eval_LOCATION_f1": 0.7919463087248322,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7375,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6461538461538463,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6086956521739131,
"eval_ORGANIZATION_recall": 0.6885245901639344,
"eval_PERSON_f1": 0.9113924050632911,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8834355828220859,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.742857142857143,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6842105263157895,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.717948717948718,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.1337006390094757,
"eval_overall_accuracy": 0.9591280653950953,
"eval_overall_f1": 0.8136054421768707,
"eval_overall_precision": 0.7686375321336761,
"eval_overall_recall": 0.8641618497109826,
"eval_runtime": 0.3817,
"eval_samples_per_second": 489.934,
"eval_steps_per_second": 7.86,
"step": 2968
},
{
"epoch": 29.0,
"grad_norm": 0.6332246661186218,
"learning_rate": 3.55e-05,
"loss": 0.063,
"step": 3074
},
{
"epoch": 29.0,
"eval_LOCATION_f1": 0.8163265306122449,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6861313868613139,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.618421052631579,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.9206349206349207,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8950617283950617,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.7222222222222223,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.65,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8115942028985507,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7368421052631579,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.13317342102527618,
"eval_overall_accuracy": 0.9625959871191478,
"eval_overall_f1": 0.8270270270270269,
"eval_overall_precision": 0.7766497461928934,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.3823,
"eval_samples_per_second": 489.147,
"eval_steps_per_second": 7.847,
"step": 3074
},
{
"epoch": 30.0,
"grad_norm": 0.4695894122123718,
"learning_rate": 3.5e-05,
"loss": 0.0611,
"step": 3180
},
{
"epoch": 30.0,
"eval_LOCATION_f1": 0.821917808219178,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7792207792207793,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6618705035971222,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5897435897435898,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9148264984227129,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8841463414634146,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.7222222222222223,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.65,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.835820895522388,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.1411614716053009,
"eval_overall_accuracy": 0.9611097349516968,
"eval_overall_f1": 0.8232118758434549,
"eval_overall_precision": 0.7721518987341772,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.3814,
"eval_samples_per_second": 490.271,
"eval_steps_per_second": 7.865,
"step": 3180
},
{
"epoch": 31.0,
"grad_norm": 0.49676990509033203,
"learning_rate": 3.45e-05,
"loss": 0.0599,
"step": 3286
},
{
"epoch": 31.0,
"eval_LOCATION_f1": 0.8194444444444444,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7866666666666666,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6870229007633588,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6428571428571429,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.9148264984227129,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8841463414634146,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.7323943661971831,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.835820895522388,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7777777777777778,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.1362539380788803,
"eval_overall_accuracy": 0.9628436958137231,
"eval_overall_f1": 0.8301369863013699,
"eval_overall_precision": 0.7890625,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.3837,
"eval_samples_per_second": 487.372,
"eval_steps_per_second": 7.819,
"step": 3286
},
{
"epoch": 32.0,
"grad_norm": 0.4171547591686249,
"learning_rate": 3.4000000000000007e-05,
"loss": 0.0587,
"step": 3392
},
{
"epoch": 32.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6323529411764707,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5733333333333334,
"eval_ORGANIZATION_recall": 0.7049180327868853,
"eval_PERSON_f1": 0.8958990536277602,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8658536585365854,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.7222222222222223,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.65,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8059701492537312,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.13879260420799255,
"eval_overall_accuracy": 0.9593757740896706,
"eval_overall_f1": 0.8054054054054054,
"eval_overall_precision": 0.7563451776649747,
"eval_overall_recall": 0.861271676300578,
"eval_runtime": 0.383,
"eval_samples_per_second": 488.286,
"eval_steps_per_second": 7.833,
"step": 3392
},
{
"epoch": 33.0,
"grad_norm": 0.9487641453742981,
"learning_rate": 3.35e-05,
"loss": 0.0586,
"step": 3498
},
{
"epoch": 33.0,
"eval_LOCATION_f1": 0.8082191780821918,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7662337662337663,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6617647058823529,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.9015873015873016,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8765432098765432,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.75,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.13592539727687836,
"eval_overall_accuracy": 0.9623482784245727,
"eval_overall_f1": 0.8185538881309687,
"eval_overall_precision": 0.7751937984496124,
"eval_overall_recall": 0.8670520231213873,
"eval_runtime": 0.3847,
"eval_samples_per_second": 486.08,
"eval_steps_per_second": 7.798,
"step": 3498
},
{
"epoch": 34.0,
"grad_norm": 0.36479949951171875,
"learning_rate": 3.3e-05,
"loss": 0.0568,
"step": 3604
},
{
"epoch": 34.0,
"eval_LOCATION_f1": 0.7919463087248322,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7375,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7164179104477612,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6575342465753424,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9303797468354431,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.901840490797546,
"eval_PERSON_recall": 0.9607843137254902,
"eval_QUANTITY_f1": 0.7605633802816902,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.782608695652174,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7105263157894737,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.14891496300697327,
"eval_overall_accuracy": 0.9621005697299975,
"eval_overall_f1": 0.8335588633288228,
"eval_overall_precision": 0.7837150127226463,
"eval_overall_recall": 0.8901734104046243,
"eval_runtime": 0.3828,
"eval_samples_per_second": 488.486,
"eval_steps_per_second": 7.837,
"step": 3604
},
{
"epoch": 35.0,
"grad_norm": 1.6607528924942017,
"learning_rate": 3.2500000000000004e-05,
"loss": 0.0563,
"step": 3710
},
{
"epoch": 35.0,
"eval_LOCATION_f1": 0.7945205479452054,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7532467532467533,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.7428571428571428,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6582278481012658,
"eval_ORGANIZATION_recall": 0.8524590163934426,
"eval_PERSON_f1": 0.926517571884984,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.90625,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.7605633802816902,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.875,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8484848484848485,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.13815556466579437,
"eval_overall_accuracy": 0.9633391132028735,
"eval_overall_f1": 0.8446866485013624,
"eval_overall_precision": 0.7989690721649485,
"eval_overall_recall": 0.8959537572254336,
"eval_runtime": 0.3811,
"eval_samples_per_second": 490.694,
"eval_steps_per_second": 7.872,
"step": 3710
},
{
"epoch": 36.0,
"grad_norm": 0.37544718384742737,
"learning_rate": 3.2000000000000005e-05,
"loss": 0.0549,
"step": 3816
},
{
"epoch": 36.0,
"eval_LOCATION_f1": 0.7891156462585034,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7435897435897436,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.7101449275362318,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6363636363636364,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.89937106918239,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8666666666666667,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.7536231884057971,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.13398179411888123,
"eval_overall_accuracy": 0.9625959871191478,
"eval_overall_f1": 0.8233695652173912,
"eval_overall_precision": 0.7769230769230769,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.3859,
"eval_samples_per_second": 484.607,
"eval_steps_per_second": 7.774,
"step": 3816
},
{
"epoch": 37.0,
"grad_norm": 1.0679214000701904,
"learning_rate": 3.15e-05,
"loss": 0.0534,
"step": 3922
},
{
"epoch": 37.0,
"eval_LOCATION_f1": 0.8251748251748252,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7972972972972973,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6766917293233082,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.9171974522292994,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8944099378881988,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.875,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8484848484848485,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.13130351901054382,
"eval_overall_accuracy": 0.9658162001486252,
"eval_overall_f1": 0.8404993065187241,
"eval_overall_precision": 0.808,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.3837,
"eval_samples_per_second": 487.405,
"eval_steps_per_second": 7.819,
"step": 3922
},
{
"epoch": 38.0,
"grad_norm": 0.24864430725574493,
"learning_rate": 3.1e-05,
"loss": 0.0549,
"step": 4028
},
{
"epoch": 38.0,
"eval_LOCATION_f1": 0.7972972972972974,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7468354430379747,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6412213740458015,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6,
"eval_ORGANIZATION_recall": 0.6885245901639344,
"eval_PERSON_f1": 0.9177215189873417,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8895705521472392,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.7222222222222223,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.65,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.875,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8484848484848485,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.13381846249103546,
"eval_overall_accuracy": 0.9616051523408472,
"eval_overall_f1": 0.8207934336525308,
"eval_overall_precision": 0.7792207792207793,
"eval_overall_recall": 0.8670520231213873,
"eval_runtime": 0.3832,
"eval_samples_per_second": 487.955,
"eval_steps_per_second": 7.828,
"step": 4028
},
{
"epoch": 39.0,
"grad_norm": 0.7260211110115051,
"learning_rate": 3.05e-05,
"loss": 0.0503,
"step": 4134
},
{
"epoch": 39.0,
"eval_LOCATION_f1": 0.8137931034482757,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7763157894736842,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6818181818181818,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6338028169014085,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.9206349206349207,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8950617283950617,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.13943922519683838,
"eval_overall_accuracy": 0.9635868218974486,
"eval_overall_f1": 0.8347107438016529,
"eval_overall_precision": 0.7973684210526316,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.3818,
"eval_samples_per_second": 489.726,
"eval_steps_per_second": 7.857,
"step": 4134
},
{
"epoch": 40.0,
"grad_norm": 0.6635225415229797,
"learning_rate": 3e-05,
"loss": 0.0492,
"step": 4240
},
{
"epoch": 40.0,
"eval_LOCATION_f1": 0.8079470198675496,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.6515151515151515,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6056338028169014,
"eval_ORGANIZATION_recall": 0.7049180327868853,
"eval_PERSON_f1": 0.909657320872274,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8690476190476191,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8405797101449276,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7631578947368421,
"eval_TIME_recall": 0.9354838709677419,
"eval_loss": 0.15114636719226837,
"eval_overall_accuracy": 0.9618528610354223,
"eval_overall_f1": 0.8236877523553163,
"eval_overall_precision": 0.7707808564231738,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.3819,
"eval_samples_per_second": 489.6,
"eval_steps_per_second": 7.855,
"step": 4240
},
{
"epoch": 41.0,
"grad_norm": 0.1464150995016098,
"learning_rate": 2.95e-05,
"loss": 0.0489,
"step": 4346
},
{
"epoch": 41.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7058823529411764,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.64,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9119496855345912,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8787878787878788,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.7605633802816902,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8923076923076922,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8529411764705882,
"eval_TIME_recall": 0.9354838709677419,
"eval_loss": 0.14375168085098267,
"eval_overall_accuracy": 0.9648253653703245,
"eval_overall_f1": 0.8373983739837398,
"eval_overall_precision": 0.7882653061224489,
"eval_overall_recall": 0.8930635838150289,
"eval_runtime": 0.3823,
"eval_samples_per_second": 489.175,
"eval_steps_per_second": 7.848,
"step": 4346
},
{
"epoch": 42.0,
"grad_norm": 0.8611084818840027,
"learning_rate": 2.9e-05,
"loss": 0.0484,
"step": 4452
},
{
"epoch": 42.0,
"eval_LOCATION_f1": 0.7891156462585034,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7435897435897436,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.7092198581560285,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.9177215189873417,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8895705521472392,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.15438592433929443,
"eval_overall_accuracy": 0.9608620262571216,
"eval_overall_f1": 0.8308525033829499,
"eval_overall_precision": 0.7811704834605598,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3851,
"eval_samples_per_second": 485.57,
"eval_steps_per_second": 7.79,
"step": 4452
},
{
"epoch": 43.0,
"grad_norm": 0.7216106653213501,
"learning_rate": 2.8499999999999998e-05,
"loss": 0.0446,
"step": 4558
},
{
"epoch": 43.0,
"eval_LOCATION_f1": 0.8163265306122449,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7692307692307693,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6456692913385826,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6212121212121212,
"eval_ORGANIZATION_recall": 0.6721311475409836,
"eval_PERSON_f1": 0.9171974522292994,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8944099378881988,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.823529411764706,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7777777777777778,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.90625,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8787878787878788,
"eval_TIME_recall": 0.9354838709677419,
"eval_loss": 0.13229750096797943,
"eval_overall_accuracy": 0.9643299479811741,
"eval_overall_f1": 0.8388888888888889,
"eval_overall_precision": 0.8074866310160428,
"eval_overall_recall": 0.8728323699421965,
"eval_runtime": 0.3838,
"eval_samples_per_second": 487.289,
"eval_steps_per_second": 7.817,
"step": 4558
},
{
"epoch": 44.0,
"grad_norm": 0.5811746716499329,
"learning_rate": 2.8000000000000003e-05,
"loss": 0.0463,
"step": 4664
},
{
"epoch": 44.0,
"eval_LOCATION_f1": 0.8157894736842105,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.7014925373134328,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6438356164383562,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.8987341772151898,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8711656441717791,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.7323943661971831,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8125,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.14487981796264648,
"eval_overall_accuracy": 0.9621005697299975,
"eval_overall_f1": 0.8238482384823848,
"eval_overall_precision": 0.7755102040816326,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3833,
"eval_samples_per_second": 487.825,
"eval_steps_per_second": 7.826,
"step": 4664
},
{
"epoch": 45.0,
"grad_norm": 0.9379541277885437,
"learning_rate": 2.7500000000000004e-05,
"loss": 0.0457,
"step": 4770
},
{
"epoch": 45.0,
"eval_LOCATION_f1": 0.8378378378378378,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.6976744186046512,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6617647058823529,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.9050632911392406,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8773006134969326,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.7999999999999999,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7368421052631579,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.8484848484848486,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.13066914677619934,
"eval_overall_accuracy": 0.9648253653703245,
"eval_overall_f1": 0.839506172839506,
"eval_overall_precision": 0.7989556135770235,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.3832,
"eval_samples_per_second": 488.01,
"eval_steps_per_second": 7.829,
"step": 4770
},
{
"epoch": 46.0,
"grad_norm": 0.38373321294784546,
"learning_rate": 2.7000000000000002e-05,
"loss": 0.0436,
"step": 4876
},
{
"epoch": 46.0,
"eval_LOCATION_f1": 0.8053691275167786,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6969696969696969,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.647887323943662,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9085173501577287,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8780487804878049,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.7999999999999999,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7368421052631579,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.14025072753429413,
"eval_overall_accuracy": 0.9625959871191478,
"eval_overall_f1": 0.8333333333333334,
"eval_overall_precision": 0.7901554404145078,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.3836,
"eval_samples_per_second": 487.546,
"eval_steps_per_second": 7.822,
"step": 4876
},
{
"epoch": 47.0,
"grad_norm": 0.8705413937568665,
"learning_rate": 2.6500000000000004e-05,
"loss": 0.0439,
"step": 4982
},
{
"epoch": 47.0,
"eval_LOCATION_f1": 0.821917808219178,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7792207792207793,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.682170542635659,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.7213114754098361,
"eval_PERSON_f1": 0.9177215189873417,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8895705521472392,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.7999999999999999,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7368421052631579,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.84375,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1442147195339203,
"eval_overall_accuracy": 0.964082239286599,
"eval_overall_f1": 0.8397790055248618,
"eval_overall_precision": 0.8042328042328042,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3847,
"eval_samples_per_second": 486.092,
"eval_steps_per_second": 7.798,
"step": 4982
},
{
"epoch": 48.0,
"grad_norm": 0.906028151512146,
"learning_rate": 2.6000000000000002e-05,
"loss": 0.0425,
"step": 5088
},
{
"epoch": 48.0,
"eval_LOCATION_f1": 0.7999999999999999,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7246376811594203,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6493506493506493,
"eval_ORGANIZATION_recall": 0.819672131147541,
"eval_PERSON_f1": 0.910828025477707,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8881987577639752,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.767123287671233,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6829268292682927,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.823529411764706,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7567567567567568,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.1539994776248932,
"eval_overall_accuracy": 0.9618528610354223,
"eval_overall_f1": 0.8317631224764468,
"eval_overall_precision": 0.7783375314861462,
"eval_overall_recall": 0.8930635838150289,
"eval_runtime": 0.3824,
"eval_samples_per_second": 489.027,
"eval_steps_per_second": 7.845,
"step": 5088
},
{
"epoch": 49.0,
"grad_norm": 0.25983723998069763,
"learning_rate": 2.5500000000000003e-05,
"loss": 0.0446,
"step": 5194
},
{
"epoch": 49.0,
"eval_LOCATION_f1": 0.786206896551724,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8260869565217391,
"eval_ORGANIZATION_f1": 0.6865671641791045,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6301369863013698,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9056603773584905,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8727272727272727,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.7826086956521738,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.14243273437023163,
"eval_overall_accuracy": 0.9630914045082982,
"eval_overall_f1": 0.8241758241758242,
"eval_overall_precision": 0.7853403141361257,
"eval_overall_recall": 0.8670520231213873,
"eval_runtime": 0.3807,
"eval_samples_per_second": 491.159,
"eval_steps_per_second": 7.88,
"step": 5194
},
{
"epoch": 50.0,
"grad_norm": 0.8506327867507935,
"learning_rate": 2.5e-05,
"loss": 0.0409,
"step": 5300
},
{
"epoch": 50.0,
"eval_LOCATION_f1": 0.8275862068965517,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7894736842105263,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6976744186046512,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6617647058823529,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.9085173501577287,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8780487804878049,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.7826086956521738,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.14614629745483398,
"eval_overall_accuracy": 0.9648253653703245,
"eval_overall_f1": 0.833103448275862,
"eval_overall_precision": 0.7968337730870713,
"eval_overall_recall": 0.8728323699421965,
"eval_runtime": 0.383,
"eval_samples_per_second": 488.264,
"eval_steps_per_second": 7.833,
"step": 5300
},
{
"epoch": 51.0,
"grad_norm": 0.6887333989143372,
"learning_rate": 2.45e-05,
"loss": 0.0419,
"step": 5406
},
{
"epoch": 51.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6799999999999999,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.5730337078651685,
"eval_ORGANIZATION_recall": 0.8360655737704918,
"eval_PERSON_f1": 0.9119496855345912,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8787878787878788,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8615384615384616,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8235294117647058,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.1532040238380432,
"eval_overall_accuracy": 0.9603666088679713,
"eval_overall_f1": 0.8282290279627165,
"eval_overall_precision": 0.7679012345679013,
"eval_overall_recall": 0.8988439306358381,
"eval_runtime": 0.3837,
"eval_samples_per_second": 487.302,
"eval_steps_per_second": 7.818,
"step": 5406
},
{
"epoch": 52.0,
"grad_norm": 0.8161492347717285,
"learning_rate": 2.4e-05,
"loss": 0.0406,
"step": 5512
},
{
"epoch": 52.0,
"eval_LOCATION_f1": 0.8053691275167786,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7164179104477612,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6575342465753424,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9079365079365078,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8827160493827161,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.823529411764706,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7777777777777778,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.8484848484848486,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.14783500134944916,
"eval_overall_accuracy": 0.9645776566757494,
"eval_overall_f1": 0.8387978142076503,
"eval_overall_precision": 0.7953367875647669,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3829,
"eval_samples_per_second": 488.43,
"eval_steps_per_second": 7.836,
"step": 5512
},
{
"epoch": 53.0,
"grad_norm": 0.7052940130233765,
"learning_rate": 2.35e-05,
"loss": 0.0417,
"step": 5618
},
{
"epoch": 53.0,
"eval_LOCATION_f1": 0.802721088435374,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7564102564102564,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6906474820143885,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6153846153846154,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9240506329113924,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8957055214723927,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8358208955223881,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.1469346284866333,
"eval_overall_accuracy": 0.9645776566757494,
"eval_overall_f1": 0.8399452804377565,
"eval_overall_precision": 0.7974025974025974,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3832,
"eval_samples_per_second": 487.973,
"eval_steps_per_second": 7.828,
"step": 5618
},
{
"epoch": 54.0,
"grad_norm": 7.3201823234558105,
"learning_rate": 2.3000000000000003e-05,
"loss": 0.0387,
"step": 5724
},
{
"epoch": 54.0,
"eval_LOCATION_f1": 0.7972972972972974,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7468354430379747,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.7218045112781954,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9177215189873417,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8895705521472392,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8181818181818182,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7714285714285715,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1538899838924408,
"eval_overall_accuracy": 0.9650730740648997,
"eval_overall_f1": 0.8383561643835618,
"eval_overall_precision": 0.796875,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.3864,
"eval_samples_per_second": 483.91,
"eval_steps_per_second": 7.763,
"step": 5724
},
{
"epoch": 55.0,
"grad_norm": 0.6526756882667542,
"learning_rate": 2.25e-05,
"loss": 0.0387,
"step": 5830
},
{
"epoch": 55.0,
"eval_LOCATION_f1": 0.7919463087248322,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7375,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6956521739130435,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6233766233766234,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9177215189873417,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8895705521472392,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.7605633802816902,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8253968253968254,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.14972607791423798,
"eval_overall_accuracy": 0.9621005697299975,
"eval_overall_f1": 0.8276797829036635,
"eval_overall_precision": 0.7800511508951407,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.3818,
"eval_samples_per_second": 489.724,
"eval_steps_per_second": 7.857,
"step": 5830
},
{
"epoch": 56.0,
"grad_norm": 0.48691311478614807,
"learning_rate": 2.2000000000000003e-05,
"loss": 0.0385,
"step": 5936
},
{
"epoch": 56.0,
"eval_LOCATION_f1": 0.802721088435374,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7564102564102564,
"eval_LOCATION_recall": 0.855072463768116,
"eval_ORGANIZATION_f1": 0.6865671641791045,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6301369863013698,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9177215189873417,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8895705521472392,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.14442645013332367,
"eval_overall_accuracy": 0.9645776566757494,
"eval_overall_f1": 0.8306010928961748,
"eval_overall_precision": 0.7875647668393783,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3823,
"eval_samples_per_second": 489.133,
"eval_steps_per_second": 7.847,
"step": 5936
},
{
"epoch": 57.0,
"grad_norm": 0.5005918145179749,
"learning_rate": 2.15e-05,
"loss": 0.0359,
"step": 6042
},
{
"epoch": 57.0,
"eval_LOCATION_f1": 0.8322147651006713,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.775,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.6511627906976745,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6176470588235294,
"eval_ORGANIZATION_recall": 0.6885245901639344,
"eval_PERSON_f1": 0.9177215189873417,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8895705521472392,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.14682108163833618,
"eval_overall_accuracy": 0.96556849145405,
"eval_overall_f1": 0.8347107438016529,
"eval_overall_precision": 0.7973684210526316,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.3819,
"eval_samples_per_second": 489.637,
"eval_steps_per_second": 7.855,
"step": 6042
},
{
"epoch": 58.0,
"grad_norm": 0.40474098920822144,
"learning_rate": 2.1e-05,
"loss": 0.0366,
"step": 6148
},
{
"epoch": 58.0,
"eval_LOCATION_f1": 0.8322147651006713,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.775,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.7014925373134328,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6438356164383562,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.9177215189873417,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8895705521472392,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.14990100264549255,
"eval_overall_accuracy": 0.9653207827594749,
"eval_overall_f1": 0.8410958904109589,
"eval_overall_precision": 0.7994791666666666,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3831,
"eval_samples_per_second": 488.137,
"eval_steps_per_second": 7.831,
"step": 6148
},
{
"epoch": 59.0,
"grad_norm": 0.5422191619873047,
"learning_rate": 2.05e-05,
"loss": 0.0349,
"step": 6254
},
{
"epoch": 59.0,
"eval_LOCATION_f1": 0.8299319727891156,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7058823529411764,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.64,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9177215189873417,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8895705521472392,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.7605633802816902,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.6923076923076923,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8484848484848486,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.15260933339595795,
"eval_overall_accuracy": 0.9653207827594749,
"eval_overall_f1": 0.8396739130434783,
"eval_overall_precision": 0.7923076923076923,
"eval_overall_recall": 0.8930635838150289,
"eval_runtime": 0.3829,
"eval_samples_per_second": 488.41,
"eval_steps_per_second": 7.835,
"step": 6254
},
{
"epoch": 60.0,
"grad_norm": 1.01388680934906,
"learning_rate": 2e-05,
"loss": 0.0358,
"step": 6360
},
{
"epoch": 60.0,
"eval_LOCATION_f1": 0.7947019867549668,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7205882352941175,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6533333333333333,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.9148264984227129,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8841463414634146,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.875,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8484848484848485,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.15072497725486755,
"eval_overall_accuracy": 0.9653207827594749,
"eval_overall_f1": 0.8373983739837398,
"eval_overall_precision": 0.7882653061224489,
"eval_overall_recall": 0.8930635838150289,
"eval_runtime": 0.3811,
"eval_samples_per_second": 490.737,
"eval_steps_per_second": 7.873,
"step": 6360
},
{
"epoch": 61.0,
"grad_norm": 0.32948485016822815,
"learning_rate": 1.9500000000000003e-05,
"loss": 0.0347,
"step": 6466
},
{
"epoch": 61.0,
"eval_LOCATION_f1": 0.8187919463087248,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.6917293233082706,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6388888888888888,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9113924050632911,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8834355828220859,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.84375,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1476087123155594,
"eval_overall_accuracy": 0.9635868218974486,
"eval_overall_f1": 0.8367626886145405,
"eval_overall_precision": 0.7963446475195822,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.3841,
"eval_samples_per_second": 486.827,
"eval_steps_per_second": 7.81,
"step": 6466
},
{
"epoch": 62.0,
"grad_norm": 0.46073493361473083,
"learning_rate": 1.9e-05,
"loss": 0.0339,
"step": 6572
},
{
"epoch": 62.0,
"eval_LOCATION_f1": 0.8243243243243245,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.6923076923076924,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6521739130434783,
"eval_ORGANIZATION_recall": 0.7377049180327869,
"eval_PERSON_f1": 0.9015873015873016,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8765432098765432,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.8115942028985507,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7567567567567568,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.8709677419354839,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8709677419354839,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.14788304269313812,
"eval_overall_accuracy": 0.9653207827594749,
"eval_overall_f1": 0.8370165745856354,
"eval_overall_precision": 0.8015873015873016,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.3849,
"eval_samples_per_second": 485.837,
"eval_steps_per_second": 7.794,
"step": 6572
},
{
"epoch": 63.0,
"grad_norm": 0.10588483512401581,
"learning_rate": 1.85e-05,
"loss": 0.035,
"step": 6678
},
{
"epoch": 63.0,
"eval_LOCATION_f1": 0.8187919463087248,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7313432835820896,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6712328767123288,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.910828025477707,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8881987577639752,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8709677419354839,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8709677419354839,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.15484392642974854,
"eval_overall_accuracy": 0.9653207827594749,
"eval_overall_f1": 0.844566712517194,
"eval_overall_precision": 0.8057742782152231,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3828,
"eval_samples_per_second": 488.461,
"eval_steps_per_second": 7.836,
"step": 6678
},
{
"epoch": 64.0,
"grad_norm": 0.8103458881378174,
"learning_rate": 1.8e-05,
"loss": 0.0316,
"step": 6784
},
{
"epoch": 64.0,
"eval_LOCATION_f1": 0.8187919463087248,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7007299270072993,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.631578947368421,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9182389937106918,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8848484848484849,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.7826086956521738,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.15606780350208282,
"eval_overall_accuracy": 0.9633391132028735,
"eval_overall_f1": 0.8380952380952382,
"eval_overall_precision": 0.7917737789203085,
"eval_overall_recall": 0.8901734104046243,
"eval_runtime": 0.3816,
"eval_samples_per_second": 490.038,
"eval_steps_per_second": 7.862,
"step": 6784
},
{
"epoch": 65.0,
"grad_norm": 0.6652474403381348,
"learning_rate": 1.75e-05,
"loss": 0.0339,
"step": 6890
},
{
"epoch": 65.0,
"eval_LOCATION_f1": 0.8299319727891156,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.6762589928057554,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6025641025641025,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.9009584664536741,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.88125,
"eval_PERSON_recall": 0.9215686274509803,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8709677419354839,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8709677419354839,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.15425816178321838,
"eval_overall_accuracy": 0.9625959871191478,
"eval_overall_f1": 0.8324175824175825,
"eval_overall_precision": 0.7931937172774869,
"eval_overall_recall": 0.8757225433526011,
"eval_runtime": 0.382,
"eval_samples_per_second": 489.487,
"eval_steps_per_second": 7.853,
"step": 6890
},
{
"epoch": 66.0,
"grad_norm": 0.5202561616897583,
"learning_rate": 1.7000000000000003e-05,
"loss": 0.0333,
"step": 6996
},
{
"epoch": 66.0,
"eval_LOCATION_f1": 0.7837837837837838,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7341772151898734,
"eval_LOCATION_recall": 0.8405797101449275,
"eval_ORGANIZATION_f1": 0.7218045112781954,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9119496855345912,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8787878787878788,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.1552451103925705,
"eval_overall_accuracy": 0.9645776566757494,
"eval_overall_f1": 0.8306010928961748,
"eval_overall_precision": 0.7875647668393783,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3837,
"eval_samples_per_second": 487.312,
"eval_steps_per_second": 7.818,
"step": 6996
},
{
"epoch": 67.0,
"grad_norm": 0.638265073299408,
"learning_rate": 1.65e-05,
"loss": 0.0328,
"step": 7102
},
{
"epoch": 67.0,
"eval_LOCATION_f1": 0.8053691275167786,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7313432835820896,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6712328767123288,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.9206349206349207,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8950617283950617,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.7826086956521738,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.1508781760931015,
"eval_overall_accuracy": 0.9660639088432004,
"eval_overall_f1": 0.8422496570644717,
"eval_overall_precision": 0.8015665796344648,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3832,
"eval_samples_per_second": 488.055,
"eval_steps_per_second": 7.83,
"step": 7102
},
{
"epoch": 68.0,
"grad_norm": 0.06523913145065308,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.0305,
"step": 7208
},
{
"epoch": 68.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7313432835820896,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6712328767123288,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.9044585987261147,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8819875776397516,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.75,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.675,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8181818181818182,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7714285714285715,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1613590270280838,
"eval_overall_accuracy": 0.9628436958137231,
"eval_overall_f1": 0.8310626702997275,
"eval_overall_precision": 0.7860824742268041,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.3829,
"eval_samples_per_second": 488.339,
"eval_steps_per_second": 7.834,
"step": 7208
},
{
"epoch": 69.0,
"grad_norm": 0.5326893329620361,
"learning_rate": 1.55e-05,
"loss": 0.0331,
"step": 7314
},
{
"epoch": 69.0,
"eval_LOCATION_f1": 0.8493150684931507,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8051948051948052,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.7076923076923076,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9079365079365078,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8827160493827161,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8888888888888888,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.875,
"eval_TIME_recall": 0.9032258064516129,
"eval_loss": 0.15333113074302673,
"eval_overall_accuracy": 0.9648253653703245,
"eval_overall_f1": 0.8488210818307905,
"eval_overall_precision": 0.816,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.3863,
"eval_samples_per_second": 484.124,
"eval_steps_per_second": 7.767,
"step": 7314
},
{
"epoch": 70.0,
"grad_norm": 0.4003902077674866,
"learning_rate": 1.5e-05,
"loss": 0.0325,
"step": 7420
},
{
"epoch": 70.0,
"eval_LOCATION_f1": 0.8356164383561644,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7922077922077922,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.6861313868613139,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.618421052631579,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.9113924050632911,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8834355828220859,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.84375,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.15659072995185852,
"eval_overall_accuracy": 0.964082239286599,
"eval_overall_f1": 0.8383561643835618,
"eval_overall_precision": 0.796875,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.3887,
"eval_samples_per_second": 481.037,
"eval_steps_per_second": 7.717,
"step": 7420
},
{
"epoch": 71.0,
"grad_norm": 0.27532684803009033,
"learning_rate": 1.45e-05,
"loss": 0.0284,
"step": 7526
},
{
"epoch": 71.0,
"eval_LOCATION_f1": 0.8053691275167786,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7153284671532848,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6447368421052632,
"eval_ORGANIZATION_recall": 0.8032786885245902,
"eval_PERSON_f1": 0.9142857142857143,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8888888888888888,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.823529411764706,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7777777777777778,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.15998543798923492,
"eval_overall_accuracy": 0.9648253653703245,
"eval_overall_f1": 0.8399452804377565,
"eval_overall_precision": 0.7974025974025974,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3818,
"eval_samples_per_second": 489.784,
"eval_steps_per_second": 7.858,
"step": 7526
},
{
"epoch": 72.0,
"grad_norm": 0.470971941947937,
"learning_rate": 1.4000000000000001e-05,
"loss": 0.0323,
"step": 7632
},
{
"epoch": 72.0,
"eval_LOCATION_f1": 0.8243243243243245,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7067669172932329,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6527777777777778,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.8987341772151898,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8711656441717791,
"eval_PERSON_recall": 0.9281045751633987,
"eval_QUANTITY_f1": 0.7826086956521738,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8064516129032258,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8064516129032258,
"eval_loss": 0.15766850113868713,
"eval_overall_accuracy": 0.9638345305920237,
"eval_overall_f1": 0.8296703296703297,
"eval_overall_precision": 0.7905759162303665,
"eval_overall_recall": 0.8728323699421965,
"eval_runtime": 0.382,
"eval_samples_per_second": 489.473,
"eval_steps_per_second": 7.853,
"step": 7632
},
{
"epoch": 73.0,
"grad_norm": 0.8524491190910339,
"learning_rate": 1.3500000000000001e-05,
"loss": 0.0289,
"step": 7738
},
{
"epoch": 73.0,
"eval_LOCATION_f1": 0.8108108108108109,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.676470588235294,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6133333333333333,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9148264984227129,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8841463414634146,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.1593465507030487,
"eval_overall_accuracy": 0.9643299479811741,
"eval_overall_f1": 0.8328767123287673,
"eval_overall_precision": 0.7916666666666666,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3839,
"eval_samples_per_second": 487.123,
"eval_steps_per_second": 7.815,
"step": 7738
},
{
"epoch": 74.0,
"grad_norm": 0.5028882026672363,
"learning_rate": 1.3000000000000001e-05,
"loss": 0.0295,
"step": 7844
},
{
"epoch": 74.0,
"eval_LOCATION_f1": 0.8378378378378378,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.6567164179104478,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6027397260273972,
"eval_ORGANIZATION_recall": 0.7213114754098361,
"eval_PERSON_f1": 0.9050632911392406,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8773006134969326,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.7826086956521738,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.16330695152282715,
"eval_overall_accuracy": 0.9633391132028735,
"eval_overall_f1": 0.8262653898768809,
"eval_overall_precision": 0.7844155844155845,
"eval_overall_recall": 0.8728323699421965,
"eval_runtime": 0.3841,
"eval_samples_per_second": 486.881,
"eval_steps_per_second": 7.811,
"step": 7844
},
{
"epoch": 75.0,
"grad_norm": 0.5104759931564331,
"learning_rate": 1.25e-05,
"loss": 0.0274,
"step": 7950
},
{
"epoch": 75.0,
"eval_LOCATION_f1": 0.8435374149659864,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.6356589147286822,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6029411764705882,
"eval_ORGANIZATION_recall": 0.6721311475409836,
"eval_PERSON_f1": 0.910828025477707,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8881987577639752,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.16056643426418304,
"eval_overall_accuracy": 0.9643299479811741,
"eval_overall_f1": 0.8282548476454293,
"eval_overall_precision": 0.7952127659574468,
"eval_overall_recall": 0.8641618497109826,
"eval_runtime": 0.38,
"eval_samples_per_second": 492.112,
"eval_steps_per_second": 7.895,
"step": 7950
},
{
"epoch": 76.0,
"grad_norm": 1.8361543416976929,
"learning_rate": 1.2e-05,
"loss": 0.0292,
"step": 8056
},
{
"epoch": 76.0,
"eval_LOCATION_f1": 0.8322147651006713,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.775,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.676470588235294,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6133333333333333,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9177215189873417,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8895705521472392,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8064516129032258,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8064516129032258,
"eval_loss": 0.16704599559307098,
"eval_overall_accuracy": 0.9643299479811741,
"eval_overall_f1": 0.8356164383561644,
"eval_overall_precision": 0.7942708333333334,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.3798,
"eval_samples_per_second": 492.394,
"eval_steps_per_second": 7.899,
"step": 8056
},
{
"epoch": 77.0,
"grad_norm": 0.2984037697315216,
"learning_rate": 1.1500000000000002e-05,
"loss": 0.0271,
"step": 8162
},
{
"epoch": 77.0,
"eval_LOCATION_f1": 0.8243243243243245,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.676470588235294,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6133333333333333,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9050632911392406,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8773006134969326,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8181818181818182,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7714285714285715,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.16829800605773926,
"eval_overall_accuracy": 0.9645776566757494,
"eval_overall_f1": 0.8283378746594006,
"eval_overall_precision": 0.7835051546391752,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.382,
"eval_samples_per_second": 489.498,
"eval_steps_per_second": 7.853,
"step": 8162
},
{
"epoch": 78.0,
"grad_norm": 0.5857195258140564,
"learning_rate": 1.1000000000000001e-05,
"loss": 0.0281,
"step": 8268
},
{
"epoch": 78.0,
"eval_LOCATION_f1": 0.8333333333333333,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6616541353383459,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6111111111111112,
"eval_ORGANIZATION_recall": 0.7213114754098361,
"eval_PERSON_f1": 0.9050632911392406,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8773006134969326,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.7826086956521738,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.84375,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.16350550949573517,
"eval_overall_accuracy": 0.9635868218974486,
"eval_overall_f1": 0.8303448275862069,
"eval_overall_precision": 0.7941952506596306,
"eval_overall_recall": 0.869942196531792,
"eval_runtime": 0.3811,
"eval_samples_per_second": 490.73,
"eval_steps_per_second": 7.873,
"step": 8268
},
{
"epoch": 79.0,
"grad_norm": 0.4454423785209656,
"learning_rate": 1.05e-05,
"loss": 0.026,
"step": 8374
},
{
"epoch": 79.0,
"eval_LOCATION_f1": 0.8391608391608392,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8108108108108109,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.6865671641791045,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6301369863013698,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.910828025477707,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8881987577639752,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8064516129032258,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8064516129032258,
"eval_loss": 0.15963782370090485,
"eval_overall_accuracy": 0.9653207827594749,
"eval_overall_f1": 0.8349514563106797,
"eval_overall_precision": 0.8026666666666666,
"eval_overall_recall": 0.869942196531792,
"eval_runtime": 0.3813,
"eval_samples_per_second": 490.451,
"eval_steps_per_second": 7.868,
"step": 8374
},
{
"epoch": 80.0,
"grad_norm": 0.3006572425365448,
"learning_rate": 1e-05,
"loss": 0.0265,
"step": 8480
},
{
"epoch": 80.0,
"eval_LOCATION_f1": 0.8053691275167786,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7058823529411764,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.64,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9177215189873417,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8895705521472392,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.1699979156255722,
"eval_overall_accuracy": 0.9633391132028735,
"eval_overall_f1": 0.8326530612244898,
"eval_overall_precision": 0.7866323907455013,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.387,
"eval_samples_per_second": 483.167,
"eval_steps_per_second": 7.751,
"step": 8480
},
{
"epoch": 81.0,
"grad_norm": 0.3541398346424103,
"learning_rate": 9.5e-06,
"loss": 0.0262,
"step": 8586
},
{
"epoch": 81.0,
"eval_LOCATION_f1": 0.8299319727891156,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7014925373134328,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6438356164383562,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.9142857142857143,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8888888888888888,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.7826086956521738,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.16345323622226715,
"eval_overall_accuracy": 0.9643299479811741,
"eval_overall_f1": 0.8367626886145405,
"eval_overall_precision": 0.7963446475195822,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.3803,
"eval_samples_per_second": 491.719,
"eval_steps_per_second": 7.889,
"step": 8586
},
{
"epoch": 82.0,
"grad_norm": 0.7298364043235779,
"learning_rate": 9e-06,
"loss": 0.0275,
"step": 8692
},
{
"epoch": 82.0,
"eval_LOCATION_f1": 0.8187919463087248,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.711111111111111,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6486486486486487,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9090909090909091,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8734939759036144,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.1723509579896927,
"eval_overall_accuracy": 0.9628436958137231,
"eval_overall_f1": 0.8319783197831978,
"eval_overall_precision": 0.7831632653061225,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3814,
"eval_samples_per_second": 490.283,
"eval_steps_per_second": 7.866,
"step": 8692
},
{
"epoch": 83.0,
"grad_norm": 0.17061911523342133,
"learning_rate": 8.500000000000002e-06,
"loss": 0.0268,
"step": 8798
},
{
"epoch": 83.0,
"eval_LOCATION_f1": 0.8299319727891156,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7014925373134328,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6438356164383562,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.910828025477707,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8881987577639752,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.1663985699415207,
"eval_overall_accuracy": 0.9625959871191478,
"eval_overall_f1": 0.8340192043895747,
"eval_overall_precision": 0.793733681462141,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3818,
"eval_samples_per_second": 489.836,
"eval_steps_per_second": 7.858,
"step": 8798
},
{
"epoch": 84.0,
"grad_norm": 1.4881929159164429,
"learning_rate": 8.000000000000001e-06,
"loss": 0.0256,
"step": 8904
},
{
"epoch": 84.0,
"eval_LOCATION_f1": 0.8275862068965517,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7894736842105263,
"eval_LOCATION_recall": 0.8695652173913043,
"eval_ORGANIZATION_f1": 0.7164179104477612,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6575342465753424,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.910828025477707,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8881987577639752,
"eval_PERSON_recall": 0.934640522875817,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.16189546883106232,
"eval_overall_accuracy": 0.9653207827594749,
"eval_overall_f1": 0.8397790055248618,
"eval_overall_precision": 0.8042328042328042,
"eval_overall_recall": 0.8786127167630058,
"eval_runtime": 0.3841,
"eval_samples_per_second": 486.853,
"eval_steps_per_second": 7.81,
"step": 8904
},
{
"epoch": 85.0,
"grad_norm": 0.3548848628997803,
"learning_rate": 7.5e-06,
"loss": 0.0265,
"step": 9010
},
{
"epoch": 85.0,
"eval_LOCATION_f1": 0.8133333333333332,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7175572519083969,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6714285714285714,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.9142857142857143,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8888888888888888,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.1618238389492035,
"eval_overall_accuracy": 0.96556849145405,
"eval_overall_f1": 0.8390646492434664,
"eval_overall_precision": 0.800524934383202,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.3818,
"eval_samples_per_second": 489.793,
"eval_steps_per_second": 7.858,
"step": 9010
},
{
"epoch": 86.0,
"grad_norm": 1.7985620498657227,
"learning_rate": 7.000000000000001e-06,
"loss": 0.0256,
"step": 9116
},
{
"epoch": 86.0,
"eval_LOCATION_f1": 0.8133333333333332,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7014925373134328,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6438356164383562,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.9148264984227129,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8841463414634146,
"eval_PERSON_recall": 0.9477124183006536,
"eval_QUANTITY_f1": 0.7714285714285714,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.16945821046829224,
"eval_overall_accuracy": 0.9635868218974486,
"eval_overall_f1": 0.8326530612244898,
"eval_overall_precision": 0.7866323907455013,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.381,
"eval_samples_per_second": 490.822,
"eval_steps_per_second": 7.874,
"step": 9116
},
{
"epoch": 87.0,
"grad_norm": 2.4566051959991455,
"learning_rate": 6.5000000000000004e-06,
"loss": 0.027,
"step": 9222
},
{
"epoch": 87.0,
"eval_LOCATION_f1": 0.8435374149659864,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.6969696969696969,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.647887323943662,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9142857142857143,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8888888888888888,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.16637147963047028,
"eval_overall_accuracy": 0.9650730740648997,
"eval_overall_f1": 0.8413793103448276,
"eval_overall_precision": 0.8047493403693932,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.382,
"eval_samples_per_second": 489.521,
"eval_steps_per_second": 7.853,
"step": 9222
},
{
"epoch": 88.0,
"grad_norm": 0.17908763885498047,
"learning_rate": 6e-06,
"loss": 0.0249,
"step": 9328
},
{
"epoch": 88.0,
"eval_LOCATION_f1": 0.8435374149659864,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.6969696969696969,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.647887323943662,
"eval_ORGANIZATION_recall": 0.7540983606557377,
"eval_PERSON_f1": 0.9182389937106918,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8848484848484849,
"eval_PERSON_recall": 0.954248366013072,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.84375,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.8181818181818182,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1701187640428543,
"eval_overall_accuracy": 0.96556849145405,
"eval_overall_f1": 0.8461538461538461,
"eval_overall_precision": 0.806282722513089,
"eval_overall_recall": 0.8901734104046243,
"eval_runtime": 0.3825,
"eval_samples_per_second": 488.883,
"eval_steps_per_second": 7.843,
"step": 9328
},
{
"epoch": 89.0,
"grad_norm": 0.9025946855545044,
"learning_rate": 5.500000000000001e-06,
"loss": 0.0247,
"step": 9434
},
{
"epoch": 89.0,
"eval_LOCATION_f1": 0.8378378378378378,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.712121212121212,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6619718309859155,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.9142857142857143,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8888888888888888,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.1655082106590271,
"eval_overall_accuracy": 0.9653207827594749,
"eval_overall_f1": 0.8429752066115701,
"eval_overall_precision": 0.8052631578947368,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.3811,
"eval_samples_per_second": 490.73,
"eval_steps_per_second": 7.873,
"step": 9434
},
{
"epoch": 90.0,
"grad_norm": 1.3243649005889893,
"learning_rate": 5e-06,
"loss": 0.0235,
"step": 9540
},
{
"epoch": 90.0,
"eval_LOCATION_f1": 0.8378378378378378,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.7164179104477612,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6575342465753424,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9142857142857143,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8888888888888888,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.17127062380313873,
"eval_overall_accuracy": 0.9645776566757494,
"eval_overall_f1": 0.8410958904109589,
"eval_overall_precision": 0.7994791666666666,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3794,
"eval_samples_per_second": 492.85,
"eval_steps_per_second": 7.907,
"step": 9540
},
{
"epoch": 91.0,
"grad_norm": 0.2453767955303192,
"learning_rate": 4.5e-06,
"loss": 0.0246,
"step": 9646
},
{
"epoch": 91.0,
"eval_LOCATION_f1": 0.8243243243243245,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7164179104477612,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6575342465753424,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9142857142857143,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8888888888888888,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.8358208955223881,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.1665855497121811,
"eval_overall_accuracy": 0.9660639088432004,
"eval_overall_f1": 0.8449931412894376,
"eval_overall_precision": 0.804177545691906,
"eval_overall_recall": 0.8901734104046243,
"eval_runtime": 0.3828,
"eval_samples_per_second": 488.477,
"eval_steps_per_second": 7.837,
"step": 9646
},
{
"epoch": 92.0,
"grad_norm": 1.269940733909607,
"learning_rate": 4.000000000000001e-06,
"loss": 0.0236,
"step": 9752
},
{
"epoch": 92.0,
"eval_LOCATION_f1": 0.8299319727891156,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.782051282051282,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7164179104477612,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6575342465753424,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9142857142857143,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8888888888888888,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.8307692307692308,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7941176470588235,
"eval_TIME_recall": 0.8709677419354839,
"eval_loss": 0.16694949567317963,
"eval_overall_accuracy": 0.9660639088432004,
"eval_overall_f1": 0.8434065934065934,
"eval_overall_precision": 0.8036649214659686,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3845,
"eval_samples_per_second": 486.384,
"eval_steps_per_second": 7.803,
"step": 9752
},
{
"epoch": 93.0,
"grad_norm": 5.042428016662598,
"learning_rate": 3.5000000000000004e-06,
"loss": 0.0258,
"step": 9858
},
{
"epoch": 93.0,
"eval_LOCATION_f1": 0.8435374149659864,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.7058823529411764,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.64,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9142857142857143,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8888888888888888,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.8358208955223881,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.16739746928215027,
"eval_overall_accuracy": 0.9653207827594749,
"eval_overall_f1": 0.8438356164383563,
"eval_overall_precision": 0.8020833333333334,
"eval_overall_recall": 0.8901734104046243,
"eval_runtime": 0.3873,
"eval_samples_per_second": 482.841,
"eval_steps_per_second": 7.746,
"step": 9858
},
{
"epoch": 94.0,
"grad_norm": 0.5611863732337952,
"learning_rate": 3e-06,
"loss": 0.0234,
"step": 9964
},
{
"epoch": 94.0,
"eval_LOCATION_f1": 0.8378378378378378,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.7058823529411764,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.64,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9142857142857143,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8888888888888888,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.8358208955223881,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.8,
"eval_QUANTITY_recall": 0.875,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.16788025200366974,
"eval_overall_accuracy": 0.9658162001486252,
"eval_overall_f1": 0.8426812585499317,
"eval_overall_precision": 0.8,
"eval_overall_recall": 0.8901734104046243,
"eval_runtime": 0.3818,
"eval_samples_per_second": 489.745,
"eval_steps_per_second": 7.857,
"step": 9964
},
{
"epoch": 95.0,
"grad_norm": 0.447412371635437,
"learning_rate": 2.5e-06,
"loss": 0.0241,
"step": 10070
},
{
"epoch": 95.0,
"eval_LOCATION_f1": 0.8378378378378378,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.7058823529411764,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.64,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9142857142857143,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8888888888888888,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.7826086956521738,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.16969862580299377,
"eval_overall_accuracy": 0.9643299479811741,
"eval_overall_f1": 0.8376534788540245,
"eval_overall_precision": 0.7932816537467701,
"eval_overall_recall": 0.8872832369942196,
"eval_runtime": 0.3808,
"eval_samples_per_second": 491.035,
"eval_steps_per_second": 7.878,
"step": 10070
},
{
"epoch": 96.0,
"grad_norm": 0.7546741962432861,
"learning_rate": 2.0000000000000003e-06,
"loss": 0.0235,
"step": 10176
},
{
"epoch": 96.0,
"eval_LOCATION_f1": 0.8243243243243245,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.711111111111111,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6486486486486487,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9142857142857143,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8888888888888888,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.1665157824754715,
"eval_overall_accuracy": 0.9650730740648997,
"eval_overall_f1": 0.8383561643835618,
"eval_overall_precision": 0.796875,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.3816,
"eval_samples_per_second": 489.992,
"eval_steps_per_second": 7.861,
"step": 10176
},
{
"epoch": 97.0,
"grad_norm": 0.45943042635917664,
"learning_rate": 1.5e-06,
"loss": 0.0238,
"step": 10282
},
{
"epoch": 97.0,
"eval_LOCATION_f1": 0.8187919463087248,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7067669172932329,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6527777777777778,
"eval_ORGANIZATION_recall": 0.7704918032786885,
"eval_PERSON_f1": 0.9142857142857143,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8888888888888888,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.7826086956521738,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.16720008850097656,
"eval_overall_accuracy": 0.9653207827594749,
"eval_overall_f1": 0.8344733242134064,
"eval_overall_precision": 0.7922077922077922,
"eval_overall_recall": 0.8815028901734104,
"eval_runtime": 0.3835,
"eval_samples_per_second": 487.614,
"eval_steps_per_second": 7.823,
"step": 10282
},
{
"epoch": 98.0,
"grad_norm": 0.08422825485467911,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0222,
"step": 10388
},
{
"epoch": 98.0,
"eval_LOCATION_f1": 0.8243243243243245,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.711111111111111,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6486486486486487,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9142857142857143,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8888888888888888,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.1667957454919815,
"eval_overall_accuracy": 0.9648253653703245,
"eval_overall_f1": 0.8383561643835618,
"eval_overall_precision": 0.796875,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.3821,
"eval_samples_per_second": 489.465,
"eval_steps_per_second": 7.852,
"step": 10388
},
{
"epoch": 99.0,
"grad_norm": 0.2250053733587265,
"learning_rate": 5.000000000000001e-07,
"loss": 0.0239,
"step": 10494
},
{
"epoch": 99.0,
"eval_LOCATION_f1": 0.8243243243243245,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7164179104477612,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6575342465753424,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9142857142857143,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8888888888888888,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.1667199730873108,
"eval_overall_accuracy": 0.9648253653703245,
"eval_overall_f1": 0.839506172839506,
"eval_overall_precision": 0.7989556135770235,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.3828,
"eval_samples_per_second": 488.496,
"eval_steps_per_second": 7.837,
"step": 10494
},
{
"epoch": 100.0,
"grad_norm": 0.21176059544086456,
"learning_rate": 0.0,
"loss": 0.0232,
"step": 10600
},
{
"epoch": 100.0,
"eval_LOCATION_f1": 0.8243243243243245,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.7164179104477612,
"eval_ORGANIZATION_number": 61,
"eval_ORGANIZATION_precision": 0.6575342465753424,
"eval_ORGANIZATION_recall": 0.7868852459016393,
"eval_PERSON_f1": 0.9142857142857143,
"eval_PERSON_number": 153,
"eval_PERSON_precision": 0.8888888888888888,
"eval_PERSON_recall": 0.9411764705882353,
"eval_QUANTITY_f1": 0.8059701492537314,
"eval_QUANTITY_number": 32,
"eval_QUANTITY_precision": 0.7714285714285715,
"eval_QUANTITY_recall": 0.84375,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 31,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.8387096774193549,
"eval_loss": 0.16671666502952576,
"eval_overall_accuracy": 0.9650730740648997,
"eval_overall_f1": 0.839506172839506,
"eval_overall_precision": 0.7989556135770235,
"eval_overall_recall": 0.884393063583815,
"eval_runtime": 0.3813,
"eval_samples_per_second": 490.38,
"eval_steps_per_second": 7.867,
"step": 10600
},
{
"epoch": 100.0,
"step": 10600,
"total_flos": 5088556202474382.0,
"train_loss": 0.07070975787234757,
"train_runtime": 630.6573,
"train_samples_per_second": 267.499,
"train_steps_per_second": 16.808
}
],
"logging_steps": 500,
"max_steps": 10600,
"num_input_tokens_seen": 0,
"num_train_epochs": 100,
"save_steps": 500,
"total_flos": 5088556202474382.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}