nerugm-lora-r16-4 / trainer_state.json
apwic's picture
End of training
996bd33 verified
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 100.0,
"eval_steps": 500,
"global_step": 10600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 1.549831748008728,
"learning_rate": 4.9500000000000004e-05,
"loss": 1.1472,
"step": 106
},
{
"epoch": 1.0,
"eval_LOCATION_f1": 0.0,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.0,
"eval_LOCATION_recall": 0.0,
"eval_ORGANIZATION_f1": 0.0,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.0,
"eval_ORGANIZATION_recall": 0.0,
"eval_PERSON_f1": 0.0,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.0,
"eval_PERSON_recall": 0.0,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.0,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.0,
"eval_TIME_recall": 0.0,
"eval_loss": 0.7123244404792786,
"eval_overall_accuracy": 0.8365739601279842,
"eval_overall_f1": 0.0,
"eval_overall_precision": 0.0,
"eval_overall_recall": 0.0,
"eval_runtime": 0.3731,
"eval_samples_per_second": 501.176,
"eval_steps_per_second": 8.04,
"step": 106
},
{
"epoch": 2.0,
"grad_norm": 1.0792208909988403,
"learning_rate": 4.9e-05,
"loss": 0.6802,
"step": 212
},
{
"epoch": 2.0,
"eval_LOCATION_f1": 0.0,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.0,
"eval_LOCATION_recall": 0.0,
"eval_ORGANIZATION_f1": 0.0,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.0,
"eval_ORGANIZATION_recall": 0.0,
"eval_PERSON_f1": 0.012738853503184716,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.14285714285714285,
"eval_PERSON_recall": 0.006666666666666667,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.0,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.0,
"eval_TIME_recall": 0.0,
"eval_loss": 0.5882730484008789,
"eval_overall_accuracy": 0.8385429485601772,
"eval_overall_f1": 0.005524861878453039,
"eval_overall_precision": 0.09090909090909091,
"eval_overall_recall": 0.002849002849002849,
"eval_runtime": 0.3704,
"eval_samples_per_second": 504.825,
"eval_steps_per_second": 8.099,
"step": 212
},
{
"epoch": 3.0,
"grad_norm": 1.0924339294433594,
"learning_rate": 4.85e-05,
"loss": 0.56,
"step": 318
},
{
"epoch": 3.0,
"eval_LOCATION_f1": 0.1176470588235294,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.4166666666666667,
"eval_LOCATION_recall": 0.0684931506849315,
"eval_ORGANIZATION_f1": 0.025974025974025976,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.08333333333333333,
"eval_ORGANIZATION_recall": 0.015384615384615385,
"eval_PERSON_f1": 0.17674418604651165,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.2923076923076923,
"eval_PERSON_recall": 0.12666666666666668,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.25925925925925924,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.35,
"eval_TIME_recall": 0.20588235294117646,
"eval_loss": 0.4647313952445984,
"eval_overall_accuracy": 0.8616785626384444,
"eval_overall_f1": 0.1391304347826087,
"eval_overall_precision": 0.29357798165137616,
"eval_overall_recall": 0.09116809116809117,
"eval_runtime": 0.3714,
"eval_samples_per_second": 503.536,
"eval_steps_per_second": 8.078,
"step": 318
},
{
"epoch": 4.0,
"grad_norm": 1.4220308065414429,
"learning_rate": 4.8e-05,
"loss": 0.4294,
"step": 424
},
{
"epoch": 4.0,
"eval_LOCATION_f1": 0.39669421487603307,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.5,
"eval_LOCATION_recall": 0.3287671232876712,
"eval_ORGANIZATION_f1": 0.12903225806451613,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.21428571428571427,
"eval_ORGANIZATION_recall": 0.09230769230769231,
"eval_PERSON_f1": 0.6538461538461539,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.6296296296296297,
"eval_PERSON_recall": 0.68,
"eval_QUANTITY_f1": 0.13333333333333333,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.1875,
"eval_QUANTITY_recall": 0.10344827586206896,
"eval_TIME_f1": 0.5671641791044776,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.5757575757575758,
"eval_TIME_recall": 0.5588235294117647,
"eval_loss": 0.3323652446269989,
"eval_overall_accuracy": 0.907703667240955,
"eval_overall_f1": 0.4827586206896552,
"eval_overall_precision": 0.5365853658536586,
"eval_overall_recall": 0.43874643874643876,
"eval_runtime": 0.374,
"eval_samples_per_second": 500.058,
"eval_steps_per_second": 8.022,
"step": 424
},
{
"epoch": 5.0,
"grad_norm": 1.3654524087905884,
"learning_rate": 4.75e-05,
"loss": 0.324,
"step": 530
},
{
"epoch": 5.0,
"eval_LOCATION_f1": 0.564102564102564,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.5301204819277109,
"eval_LOCATION_recall": 0.6027397260273972,
"eval_ORGANIZATION_f1": 0.45255474452554745,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.4305555555555556,
"eval_ORGANIZATION_recall": 0.47692307692307695,
"eval_PERSON_f1": 0.8263473053892216,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.75,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.39999999999999997,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.3870967741935484,
"eval_QUANTITY_recall": 0.41379310344827586,
"eval_TIME_f1": 0.6849315068493151,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.6410256410256411,
"eval_TIME_recall": 0.7352941176470589,
"eval_loss": 0.26078376173973083,
"eval_overall_accuracy": 0.9308392813192222,
"eval_overall_f1": 0.6578947368421052,
"eval_overall_precision": 0.6112469437652812,
"eval_overall_recall": 0.7122507122507122,
"eval_runtime": 0.3725,
"eval_samples_per_second": 502.055,
"eval_steps_per_second": 8.054,
"step": 530
},
{
"epoch": 6.0,
"grad_norm": 1.6405872106552124,
"learning_rate": 4.7e-05,
"loss": 0.2665,
"step": 636
},
{
"epoch": 6.0,
"eval_LOCATION_f1": 0.6826347305389222,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.6063829787234043,
"eval_LOCATION_recall": 0.7808219178082192,
"eval_ORGANIZATION_f1": 0.5394736842105263,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.47126436781609193,
"eval_ORGANIZATION_recall": 0.6307692307692307,
"eval_PERSON_f1": 0.8363636363636363,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7666666666666667,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.4444444444444445,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.4117647058823529,
"eval_QUANTITY_recall": 0.4827586206896552,
"eval_TIME_f1": 0.7027027027027027,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.65,
"eval_TIME_recall": 0.7647058823529411,
"eval_loss": 0.23299816250801086,
"eval_overall_accuracy": 0.934531134629584,
"eval_overall_f1": 0.7022900763358779,
"eval_overall_precision": 0.6344827586206897,
"eval_overall_recall": 0.7863247863247863,
"eval_runtime": 0.3778,
"eval_samples_per_second": 494.969,
"eval_steps_per_second": 7.941,
"step": 636
},
{
"epoch": 7.0,
"grad_norm": 1.7495594024658203,
"learning_rate": 4.6500000000000005e-05,
"loss": 0.2275,
"step": 742
},
{
"epoch": 7.0,
"eval_LOCATION_f1": 0.7349397590361444,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.6559139784946236,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.5660377358490566,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.4787234042553192,
"eval_ORGANIZATION_recall": 0.6923076923076923,
"eval_PERSON_f1": 0.8475609756097561,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7808988764044944,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.4444444444444445,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.4117647058823529,
"eval_QUANTITY_recall": 0.4827586206896552,
"eval_TIME_f1": 0.7027027027027027,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.65,
"eval_TIME_recall": 0.7647058823529411,
"eval_loss": 0.19754259288311005,
"eval_overall_accuracy": 0.9392074821560423,
"eval_overall_f1": 0.7215189873417722,
"eval_overall_precision": 0.6492027334851936,
"eval_overall_recall": 0.811965811965812,
"eval_runtime": 0.382,
"eval_samples_per_second": 489.509,
"eval_steps_per_second": 7.853,
"step": 742
},
{
"epoch": 8.0,
"grad_norm": 1.2530863285064697,
"learning_rate": 4.600000000000001e-05,
"loss": 0.2049,
"step": 848
},
{
"epoch": 8.0,
"eval_LOCATION_f1": 0.7283236994219653,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.63,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.5256410256410257,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.45054945054945056,
"eval_ORGANIZATION_recall": 0.6307692307692307,
"eval_PERSON_f1": 0.851851851851852,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7931034482758621,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.5538461538461539,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5,
"eval_QUANTITY_recall": 0.6206896551724138,
"eval_TIME_f1": 0.72,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.6585365853658537,
"eval_TIME_recall": 0.7941176470588235,
"eval_loss": 0.1830800473690033,
"eval_overall_accuracy": 0.9419148412503077,
"eval_overall_f1": 0.7238335435056746,
"eval_overall_precision": 0.6493212669683258,
"eval_overall_recall": 0.8176638176638177,
"eval_runtime": 0.3764,
"eval_samples_per_second": 496.877,
"eval_steps_per_second": 7.971,
"step": 848
},
{
"epoch": 9.0,
"grad_norm": 2.133810520172119,
"learning_rate": 4.55e-05,
"loss": 0.1888,
"step": 954
},
{
"epoch": 9.0,
"eval_LOCATION_f1": 0.7261904761904762,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.6421052631578947,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.5822784810126582,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.4946236559139785,
"eval_ORGANIZATION_recall": 0.7076923076923077,
"eval_PERSON_f1": 0.8374999999999999,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.788235294117647,
"eval_PERSON_recall": 0.8933333333333333,
"eval_QUANTITY_f1": 0.47619047619047616,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.4411764705882353,
"eval_QUANTITY_recall": 0.5172413793103449,
"eval_TIME_f1": 0.7105263157894737,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.6428571428571429,
"eval_TIME_recall": 0.7941176470588235,
"eval_loss": 0.17504610121250153,
"eval_overall_accuracy": 0.9431454590204282,
"eval_overall_f1": 0.7210191082802548,
"eval_overall_precision": 0.652073732718894,
"eval_overall_recall": 0.8062678062678063,
"eval_runtime": 0.3734,
"eval_samples_per_second": 500.739,
"eval_steps_per_second": 8.033,
"step": 954
},
{
"epoch": 10.0,
"grad_norm": 0.8962897658348083,
"learning_rate": 4.5e-05,
"loss": 0.1759,
"step": 1060
},
{
"epoch": 10.0,
"eval_LOCATION_f1": 0.7643312101910829,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7142857142857143,
"eval_LOCATION_recall": 0.821917808219178,
"eval_ORGANIZATION_f1": 0.6086956521739131,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5104166666666666,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8348909657320873,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.783625730994152,
"eval_PERSON_recall": 0.8933333333333333,
"eval_QUANTITY_f1": 0.6060606060606061,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5405405405405406,
"eval_QUANTITY_recall": 0.6896551724137931,
"eval_TIME_f1": 0.7368421052631577,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.8235294117647058,
"eval_loss": 0.16711482405662537,
"eval_overall_accuracy": 0.9458528181146936,
"eval_overall_f1": 0.7451984635083226,
"eval_overall_precision": 0.6767441860465117,
"eval_overall_recall": 0.8290598290598291,
"eval_runtime": 0.3754,
"eval_samples_per_second": 498.083,
"eval_steps_per_second": 7.991,
"step": 1060
},
{
"epoch": 11.0,
"grad_norm": 1.1401879787445068,
"learning_rate": 4.4500000000000004e-05,
"loss": 0.1691,
"step": 1166
},
{
"epoch": 11.0,
"eval_LOCATION_f1": 0.7738095238095238,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.6842105263157895,
"eval_LOCATION_recall": 0.8904109589041096,
"eval_ORGANIZATION_f1": 0.6415094339622641,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5425531914893617,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8500000000000001,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.6363636363636365,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5675675675675675,
"eval_QUANTITY_recall": 0.7241379310344828,
"eval_TIME_f1": 0.7894736842105262,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.16388720273971558,
"eval_overall_accuracy": 0.9463450652227419,
"eval_overall_f1": 0.7680608365019013,
"eval_overall_precision": 0.6917808219178082,
"eval_overall_recall": 0.8632478632478633,
"eval_runtime": 0.3746,
"eval_samples_per_second": 499.243,
"eval_steps_per_second": 8.009,
"step": 1166
},
{
"epoch": 12.0,
"grad_norm": 1.234176754951477,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.1569,
"step": 1272
},
{
"epoch": 12.0,
"eval_LOCATION_f1": 0.7901234567901235,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7191011235955056,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.625,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5263157894736842,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8385093167701863,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7848837209302325,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.6086956521739131,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.525,
"eval_QUANTITY_recall": 0.7241379310344828,
"eval_TIME_f1": 0.7532467532467532,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.6744186046511628,
"eval_TIME_recall": 0.8529411764705882,
"eval_loss": 0.16664613783359528,
"eval_overall_accuracy": 0.9458528181146936,
"eval_overall_f1": 0.7569620253164556,
"eval_overall_precision": 0.6810933940774487,
"eval_overall_recall": 0.8518518518518519,
"eval_runtime": 0.3735,
"eval_samples_per_second": 500.672,
"eval_steps_per_second": 8.032,
"step": 1272
},
{
"epoch": 13.0,
"grad_norm": 1.1105190515518188,
"learning_rate": 4.35e-05,
"loss": 0.1512,
"step": 1378
},
{
"epoch": 13.0,
"eval_LOCATION_f1": 0.7749999999999999,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7126436781609196,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6357615894039734,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5581395348837209,
"eval_ORGANIZATION_recall": 0.7384615384615385,
"eval_PERSON_f1": 0.84375,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7941176470588235,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.6268656716417911,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5526315789473685,
"eval_QUANTITY_recall": 0.7241379310344828,
"eval_TIME_f1": 0.8108108108108107,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1505931168794632,
"eval_overall_accuracy": 0.9510214127492,
"eval_overall_f1": 0.766839378238342,
"eval_overall_precision": 0.7030878859857482,
"eval_overall_recall": 0.8433048433048433,
"eval_runtime": 0.3701,
"eval_samples_per_second": 505.237,
"eval_steps_per_second": 8.105,
"step": 1378
},
{
"epoch": 14.0,
"grad_norm": 1.2889316082000732,
"learning_rate": 4.3e-05,
"loss": 0.1492,
"step": 1484
},
{
"epoch": 14.0,
"eval_LOCATION_f1": 0.7901234567901235,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7191011235955056,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.6257668711656441,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5204081632653061,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8411214953271027,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7894736842105263,
"eval_PERSON_recall": 0.9,
"eval_QUANTITY_f1": 0.6865671641791046,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6052631578947368,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.7894736842105262,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.15868589282035828,
"eval_overall_accuracy": 0.9483140536549348,
"eval_overall_f1": 0.7680608365019013,
"eval_overall_precision": 0.6917808219178082,
"eval_overall_recall": 0.8632478632478633,
"eval_runtime": 0.3734,
"eval_samples_per_second": 500.783,
"eval_steps_per_second": 8.034,
"step": 1484
},
{
"epoch": 15.0,
"grad_norm": 1.1166456937789917,
"learning_rate": 4.25e-05,
"loss": 0.1422,
"step": 1590
},
{
"epoch": 15.0,
"eval_LOCATION_f1": 0.7852760736196318,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7111111111111111,
"eval_LOCATION_recall": 0.8767123287671232,
"eval_ORGANIZATION_f1": 0.6134969325153374,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5102040816326531,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8500000000000001,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8051948051948051,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7209302325581395,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.15712317824363708,
"eval_overall_accuracy": 0.9483140536549348,
"eval_overall_f1": 0.7731305449936628,
"eval_overall_precision": 0.6963470319634704,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3753,
"eval_samples_per_second": 498.228,
"eval_steps_per_second": 7.993,
"step": 1590
},
{
"epoch": 16.0,
"grad_norm": 1.7718479633331299,
"learning_rate": 4.2e-05,
"loss": 0.1386,
"step": 1696
},
{
"epoch": 16.0,
"eval_LOCATION_f1": 0.782608695652174,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7159090909090909,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6233766233766234,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5393258426966292,
"eval_ORGANIZATION_recall": 0.7384615384615385,
"eval_PERSON_f1": 0.8714733542319748,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8224852071005917,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7352941176470588,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6410256410256411,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.7792207792207793,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.6976744186046512,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1536765843629837,
"eval_overall_accuracy": 0.9502830420871278,
"eval_overall_f1": 0.7830551989730424,
"eval_overall_precision": 0.7126168224299065,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3723,
"eval_samples_per_second": 502.251,
"eval_steps_per_second": 8.058,
"step": 1696
},
{
"epoch": 17.0,
"grad_norm": 2.4890553951263428,
"learning_rate": 4.15e-05,
"loss": 0.1351,
"step": 1802
},
{
"epoch": 17.0,
"eval_LOCATION_f1": 0.7974683544303799,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7411764705882353,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6219512195121952,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5151515151515151,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8698412698412699,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8303030303030303,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.7894736842105262,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.15198422968387604,
"eval_overall_accuracy": 0.9500369185331036,
"eval_overall_f1": 0.7814910025706941,
"eval_overall_precision": 0.711943793911007,
"eval_overall_recall": 0.8660968660968661,
"eval_runtime": 0.3738,
"eval_samples_per_second": 500.243,
"eval_steps_per_second": 8.025,
"step": 1802
},
{
"epoch": 18.0,
"grad_norm": 3.517162561416626,
"learning_rate": 4.1e-05,
"loss": 0.1397,
"step": 1908
},
{
"epoch": 18.0,
"eval_LOCATION_f1": 0.7848101265822783,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5052631578947369,
"eval_ORGANIZATION_recall": 0.7384615384615385,
"eval_PERSON_f1": 0.8698412698412699,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8303030303030303,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7575757575757576,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6756756756756757,
"eval_QUANTITY_recall": 0.8620689655172413,
"eval_TIME_f1": 0.8157894736842106,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7380952380952381,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1488378345966339,
"eval_overall_accuracy": 0.9500369185331036,
"eval_overall_f1": 0.7819354838709679,
"eval_overall_precision": 0.714622641509434,
"eval_overall_recall": 0.8632478632478633,
"eval_runtime": 0.375,
"eval_samples_per_second": 498.682,
"eval_steps_per_second": 8.0,
"step": 1908
},
{
"epoch": 19.0,
"grad_norm": 0.9577983021736145,
"learning_rate": 4.05e-05,
"loss": 0.1332,
"step": 2014
},
{
"epoch": 19.0,
"eval_LOCATION_f1": 0.802547770700637,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6296296296296297,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5257731958762887,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8670886075949367,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8253012048192772,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6461538461538462,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5833333333333334,
"eval_QUANTITY_recall": 0.7241379310344828,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.14682170748710632,
"eval_overall_accuracy": 0.9512675363032242,
"eval_overall_f1": 0.7819354838709679,
"eval_overall_precision": 0.714622641509434,
"eval_overall_recall": 0.8632478632478633,
"eval_runtime": 0.3719,
"eval_samples_per_second": 502.788,
"eval_steps_per_second": 8.066,
"step": 2014
},
{
"epoch": 20.0,
"grad_norm": 1.0945817232131958,
"learning_rate": 4e-05,
"loss": 0.1258,
"step": 2120
},
{
"epoch": 20.0,
"eval_LOCATION_f1": 0.7974683544303799,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7411764705882353,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6216216216216216,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5542168674698795,
"eval_ORGANIZATION_recall": 0.7076923076923077,
"eval_PERSON_f1": 0.8670886075949367,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8253012048192772,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.14338740706443787,
"eval_overall_accuracy": 0.9527442776273689,
"eval_overall_f1": 0.7889908256880734,
"eval_overall_precision": 0.7305825242718447,
"eval_overall_recall": 0.8575498575498576,
"eval_runtime": 0.3718,
"eval_samples_per_second": 502.95,
"eval_steps_per_second": 8.069,
"step": 2120
},
{
"epoch": 21.0,
"grad_norm": 1.6282328367233276,
"learning_rate": 3.9500000000000005e-05,
"loss": 0.1231,
"step": 2226
},
{
"epoch": 21.0,
"eval_LOCATION_f1": 0.7848101265822783,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.625,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.569620253164557,
"eval_ORGANIZATION_recall": 0.6923076923076923,
"eval_PERSON_f1": 0.8643533123028392,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8203592814371258,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1407139003276825,
"eval_overall_accuracy": 0.9544671425055378,
"eval_overall_f1": 0.785243741765481,
"eval_overall_precision": 0.7303921568627451,
"eval_overall_recall": 0.8490028490028491,
"eval_runtime": 0.3796,
"eval_samples_per_second": 492.652,
"eval_steps_per_second": 7.904,
"step": 2226
},
{
"epoch": 22.0,
"grad_norm": 1.690437912940979,
"learning_rate": 3.9000000000000006e-05,
"loss": 0.1218,
"step": 2332
},
{
"epoch": 22.0,
"eval_LOCATION_f1": 0.759493670886076,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7058823529411765,
"eval_LOCATION_recall": 0.821917808219178,
"eval_ORGANIZATION_f1": 0.6144578313253013,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.504950495049505,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.85625,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8058823529411765,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8533333333333334,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7804878048780488,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.14947740733623505,
"eval_overall_accuracy": 0.9500369185331036,
"eval_overall_f1": 0.7729591836734694,
"eval_overall_precision": 0.6997690531177829,
"eval_overall_recall": 0.8632478632478633,
"eval_runtime": 0.3754,
"eval_samples_per_second": 498.1,
"eval_steps_per_second": 7.991,
"step": 2332
},
{
"epoch": 23.0,
"grad_norm": 1.4524682760238647,
"learning_rate": 3.85e-05,
"loss": 0.1189,
"step": 2438
},
{
"epoch": 23.0,
"eval_LOCATION_f1": 0.8076923076923077,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7590361445783133,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6451612903225806,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5555555555555556,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8726114649681529,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8353658536585366,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.696969696969697,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6216216216216216,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8800000000000001,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8048780487804879,
"eval_TIME_recall": 0.9705882352941176,
"eval_loss": 0.13879932463169098,
"eval_overall_accuracy": 0.9561900073837066,
"eval_overall_f1": 0.7989556135770235,
"eval_overall_precision": 0.7373493975903614,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3734,
"eval_samples_per_second": 500.853,
"eval_steps_per_second": 8.035,
"step": 2438
},
{
"epoch": 24.0,
"grad_norm": 1.4798812866210938,
"learning_rate": 3.8e-05,
"loss": 0.1176,
"step": 2544
},
{
"epoch": 24.0,
"eval_LOCATION_f1": 0.7848101265822783,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7294117647058823,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6459627329192547,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5416666666666666,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8643533123028392,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8203592814371258,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6153846153846154,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.7894736842105262,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14802934229373932,
"eval_overall_accuracy": 0.9522520305193207,
"eval_overall_f1": 0.782051282051282,
"eval_overall_precision": 0.710955710955711,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.373,
"eval_samples_per_second": 501.394,
"eval_steps_per_second": 8.044,
"step": 2544
},
{
"epoch": 25.0,
"grad_norm": 1.3379883766174316,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.115,
"step": 2650
},
{
"epoch": 25.0,
"eval_LOCATION_f1": 0.7777777777777778,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7078651685393258,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6335403726708075,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.53125,
"eval_ORGANIZATION_recall": 0.7846153846153846,
"eval_PERSON_f1": 0.8698412698412699,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8303030303030303,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.14569295942783356,
"eval_overall_accuracy": 0.9534826482894413,
"eval_overall_f1": 0.7840616966580978,
"eval_overall_precision": 0.7142857142857143,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3725,
"eval_samples_per_second": 502.079,
"eval_steps_per_second": 8.055,
"step": 2650
},
{
"epoch": 26.0,
"grad_norm": 2.1995344161987305,
"learning_rate": 3.7e-05,
"loss": 0.1175,
"step": 2756
},
{
"epoch": 26.0,
"eval_LOCATION_f1": 0.7973856209150326,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6308724832214766,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5595238095238095,
"eval_ORGANIZATION_recall": 0.7230769230769231,
"eval_PERSON_f1": 0.879746835443038,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8373493975903614,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6153846153846154,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.14247295260429382,
"eval_overall_accuracy": 0.9554516367216342,
"eval_overall_f1": 0.7936925098554534,
"eval_overall_precision": 0.7365853658536585,
"eval_overall_recall": 0.8603988603988604,
"eval_runtime": 0.3735,
"eval_samples_per_second": 500.637,
"eval_steps_per_second": 8.032,
"step": 2756
},
{
"epoch": 27.0,
"grad_norm": 1.194440484046936,
"learning_rate": 3.65e-05,
"loss": 0.1099,
"step": 2862
},
{
"epoch": 27.0,
"eval_LOCATION_f1": 0.7820512820512822,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6883116883116883,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5955056179775281,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8825396825396825,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8424242424242424,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.575,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8311688311688312,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7441860465116279,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.14262671768665314,
"eval_overall_accuracy": 0.9556977602756583,
"eval_overall_f1": 0.7989623865110247,
"eval_overall_precision": 0.7333333333333333,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3711,
"eval_samples_per_second": 503.938,
"eval_steps_per_second": 8.085,
"step": 2862
},
{
"epoch": 28.0,
"grad_norm": 1.36868155002594,
"learning_rate": 3.6e-05,
"loss": 0.1108,
"step": 2968
},
{
"epoch": 28.0,
"eval_LOCATION_f1": 0.7999999999999999,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6842105263157896,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5977011494252874,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8706624605678233,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8263473053892215,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5945945945945946,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1398727297782898,
"eval_overall_accuracy": 0.9554516367216342,
"eval_overall_f1": 0.7973856209150327,
"eval_overall_precision": 0.7367149758454107,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3749,
"eval_samples_per_second": 498.749,
"eval_steps_per_second": 8.001,
"step": 2968
},
{
"epoch": 29.0,
"grad_norm": 0.8069501519203186,
"learning_rate": 3.55e-05,
"loss": 0.1071,
"step": 3074
},
{
"epoch": 29.0,
"eval_LOCATION_f1": 0.782608695652174,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7159090909090909,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6506024096385542,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5346534653465347,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.877742946708464,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8284023668639053,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.716417910447761,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.631578947368421,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7619047619047619,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.14704711735248566,
"eval_overall_accuracy": 0.9512675363032242,
"eval_overall_f1": 0.7934093789607097,
"eval_overall_precision": 0.7146118721461188,
"eval_overall_recall": 0.8917378917378918,
"eval_runtime": 0.3733,
"eval_samples_per_second": 500.911,
"eval_steps_per_second": 8.036,
"step": 3074
},
{
"epoch": 30.0,
"grad_norm": 1.9499945640563965,
"learning_rate": 3.5e-05,
"loss": 0.1075,
"step": 3180
},
{
"epoch": 30.0,
"eval_LOCATION_f1": 0.7999999999999999,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6714285714285715,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6266666666666667,
"eval_ORGANIZATION_recall": 0.7230769230769231,
"eval_PERSON_f1": 0.8616352201257862,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8154761904761905,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.6461538461538462,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5833333333333334,
"eval_QUANTITY_recall": 0.7241379310344828,
"eval_TIME_f1": 0.9041095890410958,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8461538461538461,
"eval_TIME_recall": 0.9705882352941176,
"eval_loss": 0.13154004514217377,
"eval_overall_accuracy": 0.956928378045779,
"eval_overall_f1": 0.7989347536617842,
"eval_overall_precision": 0.75,
"eval_overall_recall": 0.8547008547008547,
"eval_runtime": 0.3718,
"eval_samples_per_second": 502.965,
"eval_steps_per_second": 8.069,
"step": 3180
},
{
"epoch": 31.0,
"grad_norm": 0.5096124410629272,
"learning_rate": 3.45e-05,
"loss": 0.1053,
"step": 3286
},
{
"epoch": 31.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6753246753246754,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5842696629213483,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.879746835443038,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8373493975903614,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.676470588235294,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5897435897435898,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1396467238664627,
"eval_overall_accuracy": 0.9554516367216342,
"eval_overall_f1": 0.8005215123859191,
"eval_overall_precision": 0.7379807692307693,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.373,
"eval_samples_per_second": 501.294,
"eval_steps_per_second": 8.042,
"step": 3286
},
{
"epoch": 32.0,
"grad_norm": 0.622959554195404,
"learning_rate": 3.4000000000000007e-05,
"loss": 0.1027,
"step": 3392
},
{
"epoch": 32.0,
"eval_LOCATION_f1": 0.8129032258064516,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7682926829268293,
"eval_LOCATION_recall": 0.863013698630137,
"eval_ORGANIZATION_f1": 0.6748466257668712,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5612244897959183,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.879746835443038,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8373493975903614,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.696969696969697,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6216216216216216,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8533333333333334,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7804878048780488,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.14285185933113098,
"eval_overall_accuracy": 0.9549593896135861,
"eval_overall_f1": 0.8051612903225805,
"eval_overall_precision": 0.7358490566037735,
"eval_overall_recall": 0.8888888888888888,
"eval_runtime": 0.371,
"eval_samples_per_second": 504.003,
"eval_steps_per_second": 8.086,
"step": 3392
},
{
"epoch": 33.0,
"grad_norm": 1.2904415130615234,
"learning_rate": 3.35e-05,
"loss": 0.1036,
"step": 3498
},
{
"epoch": 33.0,
"eval_LOCATION_f1": 0.8051948051948052,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7654320987654321,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6878980891719746,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5869565217391305,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8734177215189873,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8313253012048193,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.716417910447761,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.631578947368421,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8378378378378379,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.775,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1392923891544342,
"eval_overall_accuracy": 0.9559438838296825,
"eval_overall_f1": 0.8046875000000001,
"eval_overall_precision": 0.7410071942446043,
"eval_overall_recall": 0.8803418803418803,
"eval_runtime": 0.3722,
"eval_samples_per_second": 502.408,
"eval_steps_per_second": 8.06,
"step": 3498
},
{
"epoch": 34.0,
"grad_norm": 3.785581350326538,
"learning_rate": 3.3e-05,
"loss": 0.1,
"step": 3604
},
{
"epoch": 34.0,
"eval_LOCATION_f1": 0.7999999999999999,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6838709677419356,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5888888888888889,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8734177215189873,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8313253012048193,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6865671641791046,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6052631578947368,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8533333333333334,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7804878048780488,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.13862958550453186,
"eval_overall_accuracy": 0.9561900073837066,
"eval_overall_f1": 0.8020833333333333,
"eval_overall_precision": 0.7386091127098321,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3727,
"eval_samples_per_second": 501.785,
"eval_steps_per_second": 8.05,
"step": 3604
},
{
"epoch": 35.0,
"grad_norm": 0.7286350131034851,
"learning_rate": 3.2500000000000004e-05,
"loss": 0.1013,
"step": 3710
},
{
"epoch": 35.0,
"eval_LOCATION_f1": 0.7948717948717949,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6875,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5789473684210527,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8734177215189873,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8313253012048193,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6956521739130435,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1437290757894516,
"eval_overall_accuracy": 0.9549593896135861,
"eval_overall_f1": 0.7989690721649485,
"eval_overall_precision": 0.7294117647058823,
"eval_overall_recall": 0.8831908831908832,
"eval_runtime": 0.3727,
"eval_samples_per_second": 501.777,
"eval_steps_per_second": 8.05,
"step": 3710
},
{
"epoch": 36.0,
"grad_norm": 0.8509505391120911,
"learning_rate": 3.2000000000000005e-05,
"loss": 0.0988,
"step": 3816
},
{
"epoch": 36.0,
"eval_LOCATION_f1": 0.7870967741935484,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6794871794871795,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5824175824175825,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8761904761904761,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8363636363636363,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.676470588235294,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5897435897435898,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.14367760717868805,
"eval_overall_accuracy": 0.9547132660595619,
"eval_overall_f1": 0.7958387516254878,
"eval_overall_precision": 0.7320574162679426,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3724,
"eval_samples_per_second": 502.107,
"eval_steps_per_second": 8.055,
"step": 3816
},
{
"epoch": 37.0,
"grad_norm": 1.2342133522033691,
"learning_rate": 3.15e-05,
"loss": 0.0971,
"step": 3922
},
{
"epoch": 37.0,
"eval_LOCATION_f1": 0.7770700636942677,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6705882352941177,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5428571428571428,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8706624605678233,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8263473053892215,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.676470588235294,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5897435897435898,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7317073170731707,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.1551184207201004,
"eval_overall_accuracy": 0.9490524243170071,
"eval_overall_f1": 0.7852604828462516,
"eval_overall_precision": 0.7087155963302753,
"eval_overall_recall": 0.8803418803418803,
"eval_runtime": 0.3737,
"eval_samples_per_second": 500.4,
"eval_steps_per_second": 8.028,
"step": 3922
},
{
"epoch": 38.0,
"grad_norm": 1.0431395769119263,
"learning_rate": 3.1e-05,
"loss": 0.0967,
"step": 4028
},
{
"epoch": 38.0,
"eval_LOCATION_f1": 0.7973856209150326,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7625,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6805555555555556,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.620253164556962,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8761904761904761,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8363636363636363,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6865671641791046,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6052631578947368,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8378378378378379,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.775,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13686208426952362,
"eval_overall_accuracy": 0.956928378045779,
"eval_overall_f1": 0.802124833997344,
"eval_overall_precision": 0.7512437810945274,
"eval_overall_recall": 0.8603988603988604,
"eval_runtime": 0.3727,
"eval_samples_per_second": 501.728,
"eval_steps_per_second": 8.049,
"step": 4028
},
{
"epoch": 39.0,
"grad_norm": 1.3837076425552368,
"learning_rate": 3.05e-05,
"loss": 0.0949,
"step": 4134
},
{
"epoch": 39.0,
"eval_LOCATION_f1": 0.7898089171974523,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6832298136645962,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5729166666666666,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8761904761904761,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8363636363636363,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5945945945945946,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13983625173568726,
"eval_overall_accuracy": 0.9559438838296825,
"eval_overall_f1": 0.7958656330749354,
"eval_overall_precision": 0.7281323877068558,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3721,
"eval_samples_per_second": 502.567,
"eval_steps_per_second": 8.063,
"step": 4134
},
{
"epoch": 40.0,
"grad_norm": 0.6632676124572754,
"learning_rate": 3e-05,
"loss": 0.0956,
"step": 4240
},
{
"epoch": 40.0,
"eval_LOCATION_f1": 0.7770700636942677,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6973684210526315,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6091954022988506,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8789808917197452,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.676470588235294,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5897435897435898,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8378378378378379,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.775,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.14134033024311066,
"eval_overall_accuracy": 0.9559438838296825,
"eval_overall_f1": 0.7999999999999999,
"eval_overall_precision": 0.7391304347826086,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3777,
"eval_samples_per_second": 495.154,
"eval_steps_per_second": 7.944,
"step": 4240
},
{
"epoch": 41.0,
"grad_norm": 0.36149993538856506,
"learning_rate": 2.95e-05,
"loss": 0.0913,
"step": 4346
},
{
"epoch": 41.0,
"eval_LOCATION_f1": 0.7898089171974523,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7051282051282052,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6043956043956044,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8789808917197452,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6865671641791046,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6052631578947368,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13970939815044403,
"eval_overall_accuracy": 0.9566822544917548,
"eval_overall_f1": 0.8036410923276982,
"eval_overall_precision": 0.7392344497607656,
"eval_overall_recall": 0.8803418803418803,
"eval_runtime": 0.3722,
"eval_samples_per_second": 502.411,
"eval_steps_per_second": 8.06,
"step": 4346
},
{
"epoch": 42.0,
"grad_norm": 0.5602841377258301,
"learning_rate": 2.9e-05,
"loss": 0.0949,
"step": 4452
},
{
"epoch": 42.0,
"eval_LOCATION_f1": 0.7870967741935484,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6923076923076923,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5934065934065934,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.676470588235294,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5897435897435898,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8378378378378379,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.775,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1462649405002594,
"eval_overall_accuracy": 0.9547132660595619,
"eval_overall_f1": 0.8026143790849672,
"eval_overall_precision": 0.7415458937198067,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3742,
"eval_samples_per_second": 499.754,
"eval_steps_per_second": 8.017,
"step": 4452
},
{
"epoch": 43.0,
"grad_norm": 0.9771382808685303,
"learning_rate": 2.8499999999999998e-05,
"loss": 0.0919,
"step": 4558
},
{
"epoch": 43.0,
"eval_LOCATION_f1": 0.7820512820512822,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.684931506849315,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6172839506172839,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8789808917197452,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5945945945945946,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1370939314365387,
"eval_overall_accuracy": 0.9566822544917548,
"eval_overall_f1": 0.7978863936591809,
"eval_overall_precision": 0.7438423645320197,
"eval_overall_recall": 0.8603988603988604,
"eval_runtime": 0.3709,
"eval_samples_per_second": 504.137,
"eval_steps_per_second": 8.088,
"step": 4558
},
{
"epoch": 44.0,
"grad_norm": 3.2234935760498047,
"learning_rate": 2.8000000000000003e-05,
"loss": 0.0895,
"step": 4664
},
{
"epoch": 44.0,
"eval_LOCATION_f1": 0.7999999999999999,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6758620689655173,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6125,
"eval_ORGANIZATION_recall": 0.7538461538461538,
"eval_PERSON_f1": 0.8825396825396825,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8424242424242424,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.6865671641791046,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6052631578947368,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8648648648648648,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.1338210105895996,
"eval_overall_accuracy": 0.9576667487078513,
"eval_overall_f1": 0.8068783068783069,
"eval_overall_precision": 0.7530864197530864,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3714,
"eval_samples_per_second": 503.565,
"eval_steps_per_second": 8.079,
"step": 4664
},
{
"epoch": 45.0,
"grad_norm": 3.458214282989502,
"learning_rate": 2.7500000000000004e-05,
"loss": 0.0899,
"step": 4770
},
{
"epoch": 45.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.821917808219178,
"eval_ORGANIZATION_f1": 0.6835443037974683,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5806451612903226,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8789808917197452,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5945945945945946,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8533333333333334,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7804878048780488,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.14024274051189423,
"eval_overall_accuracy": 0.956928378045779,
"eval_overall_f1": 0.7979139504563233,
"eval_overall_precision": 0.7355769230769231,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.4103,
"eval_samples_per_second": 455.728,
"eval_steps_per_second": 7.311,
"step": 4770
},
{
"epoch": 46.0,
"grad_norm": 1.2206172943115234,
"learning_rate": 2.7000000000000002e-05,
"loss": 0.088,
"step": 4876
},
{
"epoch": 46.0,
"eval_LOCATION_f1": 0.7922077922077922,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7019867549668873,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6162790697674418,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6461538461538462,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5833333333333334,
"eval_QUANTITY_recall": 0.7241379310344828,
"eval_TIME_f1": 0.8648648648648648,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.1336318403482437,
"eval_overall_accuracy": 0.9584051193699237,
"eval_overall_f1": 0.8068783068783069,
"eval_overall_precision": 0.7530864197530864,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3724,
"eval_samples_per_second": 502.143,
"eval_steps_per_second": 8.056,
"step": 4876
},
{
"epoch": 47.0,
"grad_norm": 1.561812162399292,
"learning_rate": 2.6500000000000004e-05,
"loss": 0.0896,
"step": 4982
},
{
"epoch": 47.0,
"eval_LOCATION_f1": 0.7770700636942677,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5894736842105263,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8853503184713376,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8475609756097561,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7619047619047619,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.14269451797008514,
"eval_overall_accuracy": 0.9561900073837066,
"eval_overall_f1": 0.805699481865285,
"eval_overall_precision": 0.7387173396674585,
"eval_overall_recall": 0.886039886039886,
"eval_runtime": 0.3722,
"eval_samples_per_second": 502.433,
"eval_steps_per_second": 8.06,
"step": 4982
},
{
"epoch": 48.0,
"grad_norm": 3.845472812652588,
"learning_rate": 2.6000000000000002e-05,
"loss": 0.0897,
"step": 5088
},
{
"epoch": 48.0,
"eval_LOCATION_f1": 0.7672955974842768,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7093023255813954,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7019867549668873,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6162790697674418,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8825396825396825,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8424242424242424,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.676470588235294,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5897435897435898,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8157894736842106,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7380952380952381,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1460731029510498,
"eval_overall_accuracy": 0.9549593896135861,
"eval_overall_f1": 0.7984395318595578,
"eval_overall_precision": 0.7344497607655502,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3721,
"eval_samples_per_second": 502.528,
"eval_steps_per_second": 8.062,
"step": 5088
},
{
"epoch": 49.0,
"grad_norm": 0.42411187291145325,
"learning_rate": 2.5500000000000003e-05,
"loss": 0.0836,
"step": 5194
},
{
"epoch": 49.0,
"eval_LOCATION_f1": 0.7770700636942677,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6838709677419356,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5888888888888889,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.696969696969697,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6216216216216216,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7317073170731707,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14366112649440765,
"eval_overall_accuracy": 0.9552055131676102,
"eval_overall_f1": 0.7973856209150327,
"eval_overall_precision": 0.7367149758454107,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3738,
"eval_samples_per_second": 500.237,
"eval_steps_per_second": 8.025,
"step": 5194
},
{
"epoch": 50.0,
"grad_norm": 1.5665122270584106,
"learning_rate": 2.5e-05,
"loss": 0.0845,
"step": 5300
},
{
"epoch": 50.0,
"eval_LOCATION_f1": 0.7770700636942677,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7051282051282052,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6043956043956044,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5945945945945946,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8378378378378379,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.775,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.14279314875602722,
"eval_overall_accuracy": 0.9552055131676102,
"eval_overall_f1": 0.8015665796344648,
"eval_overall_precision": 0.7397590361445783,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3776,
"eval_samples_per_second": 495.202,
"eval_steps_per_second": 7.944,
"step": 5300
},
{
"epoch": 51.0,
"grad_norm": 0.8180804252624512,
"learning_rate": 2.45e-05,
"loss": 0.0849,
"step": 5406
},
{
"epoch": 51.0,
"eval_LOCATION_f1": 0.7870967741935484,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6973684210526315,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6091954022988506,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6666666666666667,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.5945945945945946,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8378378378378379,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.775,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1387655884027481,
"eval_overall_accuracy": 0.9564361309377307,
"eval_overall_f1": 0.8026315789473685,
"eval_overall_precision": 0.7457212713936431,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.377,
"eval_samples_per_second": 496.079,
"eval_steps_per_second": 7.958,
"step": 5406
},
{
"epoch": 52.0,
"grad_norm": 2.047976016998291,
"learning_rate": 2.4e-05,
"loss": 0.0836,
"step": 5512
},
{
"epoch": 52.0,
"eval_LOCATION_f1": 0.7672955974842768,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7093023255813954,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7019867549668873,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6162790697674418,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6865671641791046,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6052631578947368,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.14351429045200348,
"eval_overall_accuracy": 0.9554516367216342,
"eval_overall_f1": 0.8010471204188482,
"eval_overall_precision": 0.7409200968523002,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3744,
"eval_samples_per_second": 499.405,
"eval_steps_per_second": 8.012,
"step": 5512
},
{
"epoch": 53.0,
"grad_norm": 1.9604336023330688,
"learning_rate": 2.35e-05,
"loss": 0.0838,
"step": 5618
},
{
"epoch": 53.0,
"eval_LOCATION_f1": 0.7625000000000001,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7011494252873564,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6835443037974683,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5806451612903226,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8789808917197452,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.575,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7317073170731707,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14942599833011627,
"eval_overall_accuracy": 0.9527442776273689,
"eval_overall_f1": 0.788659793814433,
"eval_overall_precision": 0.72,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3783,
"eval_samples_per_second": 494.359,
"eval_steps_per_second": 7.931,
"step": 5618
},
{
"epoch": 54.0,
"grad_norm": 1.6018130779266357,
"learning_rate": 2.3000000000000003e-05,
"loss": 0.0811,
"step": 5724
},
{
"epoch": 54.0,
"eval_LOCATION_f1": 0.7654320987654321,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.6966292134831461,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6962025316455697,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5913978494623656,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8275862068965517,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.14617691934108734,
"eval_overall_accuracy": 0.9556977602756583,
"eval_overall_f1": 0.8010335917312662,
"eval_overall_precision": 0.7328605200945626,
"eval_overall_recall": 0.8831908831908832,
"eval_runtime": 0.3727,
"eval_samples_per_second": 501.802,
"eval_steps_per_second": 8.05,
"step": 5724
},
{
"epoch": 55.0,
"grad_norm": 1.0216081142425537,
"learning_rate": 2.25e-05,
"loss": 0.0826,
"step": 5830
},
{
"epoch": 55.0,
"eval_LOCATION_f1": 0.7770700636942677,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6666666666666666,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5714285714285714,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6865671641791046,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6052631578947368,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.14629320800304413,
"eval_overall_accuracy": 0.9534826482894413,
"eval_overall_f1": 0.7942708333333333,
"eval_overall_precision": 0.7314148681055156,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.373,
"eval_samples_per_second": 501.397,
"eval_steps_per_second": 8.044,
"step": 5830
},
{
"epoch": 56.0,
"grad_norm": 1.5277239084243774,
"learning_rate": 2.2000000000000003e-05,
"loss": 0.0818,
"step": 5936
},
{
"epoch": 56.0,
"eval_LOCATION_f1": 0.7898089171974523,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.6794871794871795,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5824175824175825,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8789808917197452,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.696969696969697,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6216216216216216,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8378378378378379,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.775,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.14746278524398804,
"eval_overall_accuracy": 0.9554516367216342,
"eval_overall_f1": 0.8005215123859191,
"eval_overall_precision": 0.7379807692307693,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3747,
"eval_samples_per_second": 499.009,
"eval_steps_per_second": 8.005,
"step": 5936
},
{
"epoch": 57.0,
"grad_norm": 1.1813913583755493,
"learning_rate": 2.15e-05,
"loss": 0.0833,
"step": 6042
},
{
"epoch": 57.0,
"eval_LOCATION_f1": 0.7692307692307693,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7228915662650602,
"eval_LOCATION_recall": 0.821917808219178,
"eval_ORGANIZATION_f1": 0.6792452830188681,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.574468085106383,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8734177215189873,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8313253012048193,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6865671641791046,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6052631578947368,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1485372930765152,
"eval_overall_accuracy": 0.9529904011813931,
"eval_overall_f1": 0.7917205692108668,
"eval_overall_precision": 0.7251184834123223,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3727,
"eval_samples_per_second": 501.711,
"eval_steps_per_second": 8.049,
"step": 6042
},
{
"epoch": 58.0,
"grad_norm": 0.640755295753479,
"learning_rate": 2.1e-05,
"loss": 0.0798,
"step": 6148
},
{
"epoch": 58.0,
"eval_LOCATION_f1": 0.7692307692307693,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7228915662650602,
"eval_LOCATION_recall": 0.821917808219178,
"eval_ORGANIZATION_f1": 0.697986577181208,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6190476190476191,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.71875,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6571428571428571,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8378378378378379,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.775,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.14086660742759705,
"eval_overall_accuracy": 0.9564361309377307,
"eval_overall_f1": 0.8063660477453581,
"eval_overall_precision": 0.7543424317617866,
"eval_overall_recall": 0.8660968660968661,
"eval_runtime": 0.3766,
"eval_samples_per_second": 496.571,
"eval_steps_per_second": 7.966,
"step": 6148
},
{
"epoch": 59.0,
"grad_norm": 2.363363265991211,
"learning_rate": 2.05e-05,
"loss": 0.0802,
"step": 6254
},
{
"epoch": 59.0,
"eval_LOCATION_f1": 0.7770700636942677,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6883116883116883,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5955056179775281,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.14503292739391327,
"eval_overall_accuracy": 0.9556977602756583,
"eval_overall_f1": 0.8031496062992126,
"eval_overall_precision": 0.7445255474452555,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.374,
"eval_samples_per_second": 499.944,
"eval_steps_per_second": 8.02,
"step": 6254
},
{
"epoch": 60.0,
"grad_norm": 1.6086369752883911,
"learning_rate": 2e-05,
"loss": 0.08,
"step": 6360
},
{
"epoch": 60.0,
"eval_LOCATION_f1": 0.7999999999999999,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8493150684931506,
"eval_ORGANIZATION_f1": 0.7019867549668873,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6162790697674418,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6875,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6285714285714286,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8533333333333334,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7804878048780488,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.1365276426076889,
"eval_overall_accuracy": 0.9591434900319961,
"eval_overall_f1": 0.8121693121693121,
"eval_overall_precision": 0.7580246913580246,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3728,
"eval_samples_per_second": 501.578,
"eval_steps_per_second": 8.047,
"step": 6360
},
{
"epoch": 61.0,
"grad_norm": 1.1481249332427979,
"learning_rate": 1.9500000000000003e-05,
"loss": 0.0792,
"step": 6466
},
{
"epoch": 61.0,
"eval_LOCATION_f1": 0.7692307692307693,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7228915662650602,
"eval_LOCATION_recall": 0.821917808219178,
"eval_ORGANIZATION_f1": 0.7152317880794703,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.627906976744186,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6875,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6285714285714286,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8533333333333334,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7804878048780488,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.13838407397270203,
"eval_overall_accuracy": 0.9576667487078513,
"eval_overall_f1": 0.8073878627968336,
"eval_overall_precision": 0.7518427518427518,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3773,
"eval_samples_per_second": 495.651,
"eval_steps_per_second": 7.952,
"step": 6466
},
{
"epoch": 62.0,
"grad_norm": 1.3433496952056885,
"learning_rate": 1.9e-05,
"loss": 0.0776,
"step": 6572
},
{
"epoch": 62.0,
"eval_LOCATION_f1": 0.7692307692307693,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7228915662650602,
"eval_LOCATION_recall": 0.821917808219178,
"eval_ORGANIZATION_f1": 0.7222222222222222,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6582278481012658,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.696969696969697,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6216216216216216,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7619047619047619,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.14121700823307037,
"eval_overall_accuracy": 0.9576667487078513,
"eval_overall_f1": 0.8090185676392573,
"eval_overall_precision": 0.7568238213399504,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3749,
"eval_samples_per_second": 498.784,
"eval_steps_per_second": 8.002,
"step": 6572
},
{
"epoch": 63.0,
"grad_norm": 2.4079196453094482,
"learning_rate": 1.85e-05,
"loss": 0.0782,
"step": 6678
},
{
"epoch": 63.0,
"eval_LOCATION_f1": 0.7770700636942677,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.6878980891719746,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5869565217391305,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7619047619047619,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.1416482925415039,
"eval_overall_accuracy": 0.9554516367216342,
"eval_overall_f1": 0.804177545691906,
"eval_overall_precision": 0.7421686746987952,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3756,
"eval_samples_per_second": 497.871,
"eval_steps_per_second": 7.987,
"step": 6678
},
{
"epoch": 64.0,
"grad_norm": 0.9945477247238159,
"learning_rate": 1.8e-05,
"loss": 0.0789,
"step": 6784
},
{
"epoch": 64.0,
"eval_LOCATION_f1": 0.7770700636942677,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7123287671232877,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6419753086419753,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6875,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6285714285714286,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7619047619047619,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.13378003239631653,
"eval_overall_accuracy": 0.9581589958158996,
"eval_overall_f1": 0.8090185676392573,
"eval_overall_precision": 0.7568238213399504,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3716,
"eval_samples_per_second": 503.164,
"eval_steps_per_second": 8.072,
"step": 6784
},
{
"epoch": 65.0,
"grad_norm": 1.0777437686920166,
"learning_rate": 1.75e-05,
"loss": 0.0769,
"step": 6890
},
{
"epoch": 65.0,
"eval_LOCATION_f1": 0.7721518987341772,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7176470588235294,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7123287671232877,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6419753086419753,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13960254192352295,
"eval_overall_accuracy": 0.9579128722618755,
"eval_overall_f1": 0.8079470198675496,
"eval_overall_precision": 0.754950495049505,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3755,
"eval_samples_per_second": 497.937,
"eval_steps_per_second": 7.988,
"step": 6890
},
{
"epoch": 66.0,
"grad_norm": 0.8647677302360535,
"learning_rate": 1.7000000000000003e-05,
"loss": 0.0757,
"step": 6996
},
{
"epoch": 66.0,
"eval_LOCATION_f1": 0.7770700636942677,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7019867549668873,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6162790697674418,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.676923076923077,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6111111111111112,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7619047619047619,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.1402267962694168,
"eval_overall_accuracy": 0.9576667487078513,
"eval_overall_f1": 0.8042049934296978,
"eval_overall_precision": 0.7463414634146341,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3717,
"eval_samples_per_second": 503.11,
"eval_steps_per_second": 8.071,
"step": 6996
},
{
"epoch": 67.0,
"grad_norm": 1.0575724840164185,
"learning_rate": 1.65e-05,
"loss": 0.0753,
"step": 7102
},
{
"epoch": 67.0,
"eval_LOCATION_f1": 0.7820512820512822,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7210884353741497,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6463414634146342,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8533333333333334,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7804878048780488,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.13897380232810974,
"eval_overall_accuracy": 0.9593896135860202,
"eval_overall_f1": 0.8143236074270558,
"eval_overall_precision": 0.7617866004962779,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3722,
"eval_samples_per_second": 502.482,
"eval_steps_per_second": 8.061,
"step": 7102
},
{
"epoch": 68.0,
"grad_norm": 0.9653581976890564,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.0757,
"step": 7208
},
{
"epoch": 68.0,
"eval_LOCATION_f1": 0.7870967741935484,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7172413793103448,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.65,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8533333333333334,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7804878048780488,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.13793830573558807,
"eval_overall_accuracy": 0.9591434900319961,
"eval_overall_f1": 0.8149134487350199,
"eval_overall_precision": 0.765,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3738,
"eval_samples_per_second": 500.215,
"eval_steps_per_second": 8.025,
"step": 7208
},
{
"epoch": 69.0,
"grad_norm": 1.3589030504226685,
"learning_rate": 1.55e-05,
"loss": 0.0731,
"step": 7314
},
{
"epoch": 69.0,
"eval_LOCATION_f1": 0.7770700636942677,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7320261437908497,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6363636363636364,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.71875,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6571428571428571,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8533333333333334,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7804878048780488,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.14166338741779327,
"eval_overall_accuracy": 0.9581589958158996,
"eval_overall_f1": 0.8157894736842105,
"eval_overall_precision": 0.7579462102689487,
"eval_overall_recall": 0.8831908831908832,
"eval_runtime": 0.3735,
"eval_samples_per_second": 500.684,
"eval_steps_per_second": 8.032,
"step": 7314
},
{
"epoch": 70.0,
"grad_norm": 1.4494452476501465,
"learning_rate": 1.5e-05,
"loss": 0.0751,
"step": 7420
},
{
"epoch": 70.0,
"eval_LOCATION_f1": 0.7870967741935484,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7172413793103448,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.65,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6875,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6285714285714286,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8533333333333334,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7804878048780488,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.13516362011432648,
"eval_overall_accuracy": 0.9591434900319961,
"eval_overall_f1": 0.814419225634179,
"eval_overall_precision": 0.7663316582914573,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3728,
"eval_samples_per_second": 501.549,
"eval_steps_per_second": 8.046,
"step": 7420
},
{
"epoch": 71.0,
"grad_norm": 2.012171745300293,
"learning_rate": 1.45e-05,
"loss": 0.0755,
"step": 7526
},
{
"epoch": 71.0,
"eval_LOCATION_f1": 0.7820512820512822,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7189542483660131,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.696969696969697,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6216216216216216,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7619047619047619,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.14387430250644684,
"eval_overall_accuracy": 0.9576667487078513,
"eval_overall_f1": 0.8099606815203145,
"eval_overall_precision": 0.75,
"eval_overall_recall": 0.8803418803418803,
"eval_runtime": 0.3724,
"eval_samples_per_second": 502.104,
"eval_steps_per_second": 8.055,
"step": 7526
},
{
"epoch": 72.0,
"grad_norm": 1.370118498802185,
"learning_rate": 1.4000000000000001e-05,
"loss": 0.0745,
"step": 7632
},
{
"epoch": 72.0,
"eval_LOCATION_f1": 0.7770700636942677,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7123287671232877,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6419753086419753,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.676923076923077,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6111111111111112,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7619047619047619,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.13974949717521667,
"eval_overall_accuracy": 0.9579128722618755,
"eval_overall_f1": 0.8068783068783069,
"eval_overall_precision": 0.7530864197530864,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3737,
"eval_samples_per_second": 500.351,
"eval_steps_per_second": 8.027,
"step": 7632
},
{
"epoch": 73.0,
"grad_norm": 0.621573805809021,
"learning_rate": 1.3500000000000001e-05,
"loss": 0.0746,
"step": 7738
},
{
"epoch": 73.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.821917808219178,
"eval_ORGANIZATION_f1": 0.7172413793103448,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.65,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8533333333333334,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7804878048780488,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.1360926479101181,
"eval_overall_accuracy": 0.9591434900319961,
"eval_overall_f1": 0.8133333333333332,
"eval_overall_precision": 0.7644110275689223,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3745,
"eval_samples_per_second": 499.381,
"eval_steps_per_second": 8.011,
"step": 7738
},
{
"epoch": 74.0,
"grad_norm": 1.1147890090942383,
"learning_rate": 1.3000000000000001e-05,
"loss": 0.0727,
"step": 7844
},
{
"epoch": 74.0,
"eval_LOCATION_f1": 0.7870967741935484,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7172413793103448,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.65,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6875,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6285714285714286,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8533333333333334,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7804878048780488,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.13560639321804047,
"eval_overall_accuracy": 0.9596357371400444,
"eval_overall_f1": 0.8133333333333332,
"eval_overall_precision": 0.7644110275689223,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.374,
"eval_samples_per_second": 500.038,
"eval_steps_per_second": 8.022,
"step": 7844
},
{
"epoch": 75.0,
"grad_norm": 0.9206987619400024,
"learning_rate": 1.25e-05,
"loss": 0.0727,
"step": 7950
},
{
"epoch": 75.0,
"eval_LOCATION_f1": 0.7770700636942677,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7162162162162162,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6385542168674698,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7619047619047619,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.14432945847511292,
"eval_overall_accuracy": 0.9574206251538272,
"eval_overall_f1": 0.8110964332892999,
"eval_overall_precision": 0.7561576354679803,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.374,
"eval_samples_per_second": 499.951,
"eval_steps_per_second": 8.021,
"step": 7950
},
{
"epoch": 76.0,
"grad_norm": 1.3934582471847534,
"learning_rate": 1.2e-05,
"loss": 0.073,
"step": 8056
},
{
"epoch": 76.0,
"eval_LOCATION_f1": 0.7770700636942677,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7012987012987013,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6067415730337079,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6875,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6285714285714286,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7317073170731707,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14394371211528778,
"eval_overall_accuracy": 0.9549593896135861,
"eval_overall_f1": 0.8015768725361366,
"eval_overall_precision": 0.7439024390243902,
"eval_overall_recall": 0.8689458689458689,
"eval_runtime": 0.3764,
"eval_samples_per_second": 496.875,
"eval_steps_per_second": 7.971,
"step": 8056
},
{
"epoch": 77.0,
"grad_norm": 1.3345227241516113,
"learning_rate": 1.1500000000000002e-05,
"loss": 0.0733,
"step": 8162
},
{
"epoch": 77.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.821917808219178,
"eval_ORGANIZATION_f1": 0.7310344827586207,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6625,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6875,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6285714285714286,
"eval_QUANTITY_recall": 0.7586206896551724,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.13728104531764984,
"eval_overall_accuracy": 0.9593896135860202,
"eval_overall_f1": 0.8117489986648865,
"eval_overall_precision": 0.7638190954773869,
"eval_overall_recall": 0.8660968660968661,
"eval_runtime": 0.3706,
"eval_samples_per_second": 504.552,
"eval_steps_per_second": 8.094,
"step": 8162
},
{
"epoch": 78.0,
"grad_norm": 1.4736689329147339,
"learning_rate": 1.1000000000000001e-05,
"loss": 0.072,
"step": 8268
},
{
"epoch": 78.0,
"eval_LOCATION_f1": 0.7870967741935484,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.726027397260274,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.654320987654321,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7619047619047619,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.14146719872951508,
"eval_overall_accuracy": 0.9581589958158996,
"eval_overall_f1": 0.8154050464807436,
"eval_overall_precision": 0.763681592039801,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3724,
"eval_samples_per_second": 502.127,
"eval_steps_per_second": 8.056,
"step": 8268
},
{
"epoch": 79.0,
"grad_norm": 0.9665191769599915,
"learning_rate": 1.05e-05,
"loss": 0.0718,
"step": 8374
},
{
"epoch": 79.0,
"eval_LOCATION_f1": 0.7721518987341772,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7176470588235294,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.717948717948718,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6153846153846154,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7317073170731707,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14953278005123138,
"eval_overall_accuracy": 0.9552055131676102,
"eval_overall_f1": 0.8031290743155151,
"eval_overall_precision": 0.7403846153846154,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3713,
"eval_samples_per_second": 503.668,
"eval_steps_per_second": 8.08,
"step": 8374
},
{
"epoch": 80.0,
"grad_norm": 0.4756767153739929,
"learning_rate": 1e-05,
"loss": 0.0703,
"step": 8480
},
{
"epoch": 80.0,
"eval_LOCATION_f1": 0.7820512820512822,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7432432432432433,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6626506024096386,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7317073170731707,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14299984276294708,
"eval_overall_accuracy": 0.9571745015998031,
"eval_overall_f1": 0.8110964332892999,
"eval_overall_precision": 0.7561576354679803,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3781,
"eval_samples_per_second": 494.608,
"eval_steps_per_second": 7.935,
"step": 8480
},
{
"epoch": 81.0,
"grad_norm": 0.7018587589263916,
"learning_rate": 9.5e-06,
"loss": 0.0702,
"step": 8586
},
{
"epoch": 81.0,
"eval_LOCATION_f1": 0.7820512820512822,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7432432432432433,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6626506024096386,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.71875,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6571428571428571,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7317073170731707,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14150598645210266,
"eval_overall_accuracy": 0.9584051193699237,
"eval_overall_f1": 0.8143236074270558,
"eval_overall_precision": 0.7617866004962779,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3737,
"eval_samples_per_second": 500.383,
"eval_steps_per_second": 8.028,
"step": 8586
},
{
"epoch": 82.0,
"grad_norm": 1.6355091333389282,
"learning_rate": 9e-06,
"loss": 0.0721,
"step": 8692
},
{
"epoch": 82.0,
"eval_LOCATION_f1": 0.7820512820512822,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7432432432432433,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6626506024096386,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.71875,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6571428571428571,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8266666666666665,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7560975609756098,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.14245130121707916,
"eval_overall_accuracy": 0.958897366477972,
"eval_overall_f1": 0.8169761273209548,
"eval_overall_precision": 0.7642679900744417,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3741,
"eval_samples_per_second": 499.836,
"eval_steps_per_second": 8.019,
"step": 8692
},
{
"epoch": 83.0,
"grad_norm": 0.8933713436126709,
"learning_rate": 8.500000000000002e-06,
"loss": 0.0712,
"step": 8798
},
{
"epoch": 83.0,
"eval_LOCATION_f1": 0.7770700636942677,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7432432432432433,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6626506024096386,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.71875,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6571428571428571,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7619047619047619,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.1438244879245758,
"eval_overall_accuracy": 0.9586512429239479,
"eval_overall_f1": 0.8174603174603174,
"eval_overall_precision": 0.762962962962963,
"eval_overall_recall": 0.8803418803418803,
"eval_runtime": 0.3755,
"eval_samples_per_second": 498.003,
"eval_steps_per_second": 7.989,
"step": 8798
},
{
"epoch": 84.0,
"grad_norm": 1.0442496538162231,
"learning_rate": 8.000000000000001e-06,
"loss": 0.0719,
"step": 8904
},
{
"epoch": 84.0,
"eval_LOCATION_f1": 0.7770700636942677,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.738255033557047,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6547619047619048,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7619047619047619,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.1436508744955063,
"eval_overall_accuracy": 0.9579128722618755,
"eval_overall_f1": 0.8153034300791556,
"eval_overall_precision": 0.7592137592137592,
"eval_overall_recall": 0.8803418803418803,
"eval_runtime": 0.3727,
"eval_samples_per_second": 501.681,
"eval_steps_per_second": 8.048,
"step": 8904
},
{
"epoch": 85.0,
"grad_norm": 1.8608384132385254,
"learning_rate": 7.5e-06,
"loss": 0.0709,
"step": 9010
},
{
"epoch": 85.0,
"eval_LOCATION_f1": 0.7770700636942677,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7297297297297298,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6506024096385542,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7317073170731707,
"eval_TIME_recall": 0.8823529411764706,
"eval_loss": 0.14415280520915985,
"eval_overall_accuracy": 0.9574206251538272,
"eval_overall_f1": 0.8095238095238095,
"eval_overall_precision": 0.7555555555555555,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3737,
"eval_samples_per_second": 500.35,
"eval_steps_per_second": 8.027,
"step": 9010
},
{
"epoch": 86.0,
"grad_norm": 1.1902055740356445,
"learning_rate": 7.000000000000001e-06,
"loss": 0.0699,
"step": 9116
},
{
"epoch": 86.0,
"eval_LOCATION_f1": 0.7870967741935484,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7346938775510204,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6585365853658537,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7619047619047619,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.14072592556476593,
"eval_overall_accuracy": 0.958897366477972,
"eval_overall_f1": 0.8169761273209548,
"eval_overall_precision": 0.7642679900744417,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3749,
"eval_samples_per_second": 498.822,
"eval_steps_per_second": 8.002,
"step": 9116
},
{
"epoch": 87.0,
"grad_norm": 0.9288851022720337,
"learning_rate": 6.5000000000000004e-06,
"loss": 0.0681,
"step": 9222
},
{
"epoch": 87.0,
"eval_LOCATION_f1": 0.7820512820512822,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7346938775510204,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6585365853658537,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.71875,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6571428571428571,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7619047619047619,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.14135389029979706,
"eval_overall_accuracy": 0.958897366477972,
"eval_overall_f1": 0.8169761273209548,
"eval_overall_precision": 0.7642679900744417,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.3733,
"eval_samples_per_second": 500.974,
"eval_steps_per_second": 8.037,
"step": 9222
},
{
"epoch": 88.0,
"grad_norm": 1.107254981994629,
"learning_rate": 6e-06,
"loss": 0.0685,
"step": 9328
},
{
"epoch": 88.0,
"eval_LOCATION_f1": 0.7770700636942677,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7346938775510204,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6585365853658537,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8846153846153846,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8518518518518519,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8533333333333334,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7804878048780488,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.14269116520881653,
"eval_overall_accuracy": 0.9579128722618755,
"eval_overall_f1": 0.8148148148148149,
"eval_overall_precision": 0.7604938271604939,
"eval_overall_recall": 0.8774928774928775,
"eval_runtime": 0.378,
"eval_samples_per_second": 494.729,
"eval_steps_per_second": 7.937,
"step": 9328
},
{
"epoch": 89.0,
"grad_norm": 2.199923276901245,
"learning_rate": 5.500000000000001e-06,
"loss": 0.0703,
"step": 9434
},
{
"epoch": 89.0,
"eval_LOCATION_f1": 0.7870967741935484,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7310344827586207,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6625,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8648648648648648,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.14063221216201782,
"eval_overall_accuracy": 0.9593896135860202,
"eval_overall_f1": 0.8186666666666667,
"eval_overall_precision": 0.7694235588972431,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3757,
"eval_samples_per_second": 497.751,
"eval_steps_per_second": 7.985,
"step": 9434
},
{
"epoch": 90.0,
"grad_norm": 1.6066433191299438,
"learning_rate": 5e-06,
"loss": 0.0695,
"step": 9540
},
{
"epoch": 90.0,
"eval_LOCATION_f1": 0.7870967741935484,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.726027397260274,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.654320987654321,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8767123287671232,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.8205128205128205,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.13843446969985962,
"eval_overall_accuracy": 0.9601279842480925,
"eval_overall_f1": 0.8186666666666667,
"eval_overall_precision": 0.7694235588972431,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3746,
"eval_samples_per_second": 499.225,
"eval_steps_per_second": 8.009,
"step": 9540
},
{
"epoch": 91.0,
"grad_norm": 1.384969711303711,
"learning_rate": 4.5e-06,
"loss": 0.0684,
"step": 9646
},
{
"epoch": 91.0,
"eval_LOCATION_f1": 0.7770700636942677,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7261904761904762,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7210884353741497,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6463414634146342,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.8817891373801918,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8466257668711656,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7619047619047619,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.14361019432544708,
"eval_overall_accuracy": 0.956928378045779,
"eval_overall_f1": 0.8100263852242744,
"eval_overall_precision": 0.7542997542997543,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3739,
"eval_samples_per_second": 500.193,
"eval_steps_per_second": 8.024,
"step": 9646
},
{
"epoch": 92.0,
"grad_norm": 1.5777561664581299,
"learning_rate": 4.000000000000001e-06,
"loss": 0.0681,
"step": 9752
},
{
"epoch": 92.0,
"eval_LOCATION_f1": 0.7870967741935484,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.726027397260274,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.654320987654321,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8533333333333334,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7804878048780488,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.14141333103179932,
"eval_overall_accuracy": 0.9591434900319961,
"eval_overall_f1": 0.8164893617021275,
"eval_overall_precision": 0.7655860349127181,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3754,
"eval_samples_per_second": 498.089,
"eval_steps_per_second": 7.991,
"step": 9752
},
{
"epoch": 93.0,
"grad_norm": 0.12837229669094086,
"learning_rate": 3.5000000000000004e-06,
"loss": 0.0694,
"step": 9858
},
{
"epoch": 93.0,
"eval_LOCATION_f1": 0.7820512820512822,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7346938775510204,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6585365853658537,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8157894736842106,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7380952380952381,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.14285434782505035,
"eval_overall_accuracy": 0.9584051193699237,
"eval_overall_f1": 0.8132450331125828,
"eval_overall_precision": 0.7599009900990099,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3737,
"eval_samples_per_second": 500.447,
"eval_steps_per_second": 8.029,
"step": 9858
},
{
"epoch": 94.0,
"grad_norm": 1.4026833772659302,
"learning_rate": 3e-06,
"loss": 0.068,
"step": 9964
},
{
"epoch": 94.0,
"eval_LOCATION_f1": 0.7820512820512822,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.726027397260274,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.654320987654321,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7619047619047619,
"eval_TIME_recall": 0.9411764705882353,
"eval_loss": 0.14125195145606995,
"eval_overall_accuracy": 0.9581589958158996,
"eval_overall_f1": 0.8143236074270558,
"eval_overall_precision": 0.7617866004962779,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3714,
"eval_samples_per_second": 503.459,
"eval_steps_per_second": 8.077,
"step": 9964
},
{
"epoch": 95.0,
"grad_norm": 2.012713670730591,
"learning_rate": 2.5e-06,
"loss": 0.0682,
"step": 10070
},
{
"epoch": 95.0,
"eval_LOCATION_f1": 0.7820512820512822,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7346938775510204,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6585365853658537,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8157894736842106,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7380952380952381,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1429029256105423,
"eval_overall_accuracy": 0.9581589958158996,
"eval_overall_f1": 0.8132450331125828,
"eval_overall_precision": 0.7599009900990099,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3742,
"eval_samples_per_second": 499.707,
"eval_steps_per_second": 8.017,
"step": 10070
},
{
"epoch": 96.0,
"grad_norm": 0.9533500671386719,
"learning_rate": 2.0000000000000003e-06,
"loss": 0.0697,
"step": 10176
},
{
"epoch": 96.0,
"eval_LOCATION_f1": 0.7820512820512822,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.726027397260274,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.654320987654321,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8157894736842106,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7380952380952381,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.14225105941295624,
"eval_overall_accuracy": 0.9579128722618755,
"eval_overall_f1": 0.8116710875331565,
"eval_overall_precision": 0.7593052109181141,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3776,
"eval_samples_per_second": 495.257,
"eval_steps_per_second": 7.945,
"step": 10176
},
{
"epoch": 97.0,
"grad_norm": 0.8223116397857666,
"learning_rate": 1.5e-06,
"loss": 0.0672,
"step": 10282
},
{
"epoch": 97.0,
"eval_LOCATION_f1": 0.7820512820512822,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.726027397260274,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.654320987654321,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8157894736842106,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7380952380952381,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.14218071103096008,
"eval_overall_accuracy": 0.9579128722618755,
"eval_overall_f1": 0.8116710875331565,
"eval_overall_precision": 0.7593052109181141,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3739,
"eval_samples_per_second": 500.069,
"eval_steps_per_second": 8.022,
"step": 10282
},
{
"epoch": 98.0,
"grad_norm": 3.7341294288635254,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0674,
"step": 10388
},
{
"epoch": 98.0,
"eval_LOCATION_f1": 0.7820512820512822,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.7346938775510204,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6585365853658537,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8157894736842106,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7380952380952381,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.14276809990406036,
"eval_overall_accuracy": 0.9584051193699237,
"eval_overall_f1": 0.8132450331125828,
"eval_overall_precision": 0.7599009900990099,
"eval_overall_recall": 0.8746438746438746,
"eval_runtime": 0.3733,
"eval_samples_per_second": 500.927,
"eval_steps_per_second": 8.036,
"step": 10388
},
{
"epoch": 99.0,
"grad_norm": 0.9920492768287659,
"learning_rate": 5.000000000000001e-07,
"loss": 0.0666,
"step": 10494
},
{
"epoch": 99.0,
"eval_LOCATION_f1": 0.7820512820512822,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.726027397260274,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.654320987654321,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8157894736842106,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7380952380952381,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.14194943010807037,
"eval_overall_accuracy": 0.9581589958158996,
"eval_overall_f1": 0.8116710875331565,
"eval_overall_precision": 0.7593052109181141,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3735,
"eval_samples_per_second": 500.685,
"eval_steps_per_second": 8.032,
"step": 10494
},
{
"epoch": 100.0,
"grad_norm": 0.6790415644645691,
"learning_rate": 0.0,
"loss": 0.0693,
"step": 10600
},
{
"epoch": 100.0,
"eval_LOCATION_f1": 0.7820512820512822,
"eval_LOCATION_number": 73,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8356164383561644,
"eval_ORGANIZATION_f1": 0.726027397260274,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.654320987654321,
"eval_ORGANIZATION_recall": 0.8153846153846154,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7076923076923076,
"eval_QUANTITY_number": 29,
"eval_QUANTITY_precision": 0.6388888888888888,
"eval_QUANTITY_recall": 0.7931034482758621,
"eval_TIME_f1": 0.8157894736842106,
"eval_TIME_number": 34,
"eval_TIME_precision": 0.7380952380952381,
"eval_TIME_recall": 0.9117647058823529,
"eval_loss": 0.1422806829214096,
"eval_overall_accuracy": 0.9581589958158996,
"eval_overall_f1": 0.8116710875331565,
"eval_overall_precision": 0.7593052109181141,
"eval_overall_recall": 0.8717948717948718,
"eval_runtime": 0.3745,
"eval_samples_per_second": 499.395,
"eval_steps_per_second": 8.012,
"step": 10600
},
{
"epoch": 100.0,
"step": 10600,
"total_flos": 4551589111445376.0,
"train_loss": 0.12385802520895904,
"train_runtime": 580.0713,
"train_samples_per_second": 290.999,
"train_steps_per_second": 18.274
}
],
"logging_steps": 500,
"max_steps": 10600,
"num_input_tokens_seen": 0,
"num_train_epochs": 100,
"save_steps": 500,
"total_flos": 4551589111445376.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}