|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 100.0, |
|
"eval_steps": 500, |
|
"global_step": 10600, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"grad_norm": 1.549831748008728, |
|
"learning_rate": 4.9500000000000004e-05, |
|
"loss": 1.1472, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_LOCATION_f1": 0.0, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.0, |
|
"eval_LOCATION_recall": 0.0, |
|
"eval_ORGANIZATION_f1": 0.0, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.0, |
|
"eval_ORGANIZATION_recall": 0.0, |
|
"eval_PERSON_f1": 0.0, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.0, |
|
"eval_PERSON_recall": 0.0, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.0, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.0, |
|
"eval_TIME_recall": 0.0, |
|
"eval_loss": 0.7123244404792786, |
|
"eval_overall_accuracy": 0.8365739601279842, |
|
"eval_overall_f1": 0.0, |
|
"eval_overall_precision": 0.0, |
|
"eval_overall_recall": 0.0, |
|
"eval_runtime": 0.3731, |
|
"eval_samples_per_second": 501.176, |
|
"eval_steps_per_second": 8.04, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"grad_norm": 1.0792208909988403, |
|
"learning_rate": 4.9e-05, |
|
"loss": 0.6802, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_LOCATION_f1": 0.0, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.0, |
|
"eval_LOCATION_recall": 0.0, |
|
"eval_ORGANIZATION_f1": 0.0, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.0, |
|
"eval_ORGANIZATION_recall": 0.0, |
|
"eval_PERSON_f1": 0.012738853503184716, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.14285714285714285, |
|
"eval_PERSON_recall": 0.006666666666666667, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.0, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.0, |
|
"eval_TIME_recall": 0.0, |
|
"eval_loss": 0.5882730484008789, |
|
"eval_overall_accuracy": 0.8385429485601772, |
|
"eval_overall_f1": 0.005524861878453039, |
|
"eval_overall_precision": 0.09090909090909091, |
|
"eval_overall_recall": 0.002849002849002849, |
|
"eval_runtime": 0.3704, |
|
"eval_samples_per_second": 504.825, |
|
"eval_steps_per_second": 8.099, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"grad_norm": 1.0924339294433594, |
|
"learning_rate": 4.85e-05, |
|
"loss": 0.56, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_LOCATION_f1": 0.1176470588235294, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.4166666666666667, |
|
"eval_LOCATION_recall": 0.0684931506849315, |
|
"eval_ORGANIZATION_f1": 0.025974025974025976, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.08333333333333333, |
|
"eval_ORGANIZATION_recall": 0.015384615384615385, |
|
"eval_PERSON_f1": 0.17674418604651165, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.2923076923076923, |
|
"eval_PERSON_recall": 0.12666666666666668, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.25925925925925924, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.35, |
|
"eval_TIME_recall": 0.20588235294117646, |
|
"eval_loss": 0.4647313952445984, |
|
"eval_overall_accuracy": 0.8616785626384444, |
|
"eval_overall_f1": 0.1391304347826087, |
|
"eval_overall_precision": 0.29357798165137616, |
|
"eval_overall_recall": 0.09116809116809117, |
|
"eval_runtime": 0.3714, |
|
"eval_samples_per_second": 503.536, |
|
"eval_steps_per_second": 8.078, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"grad_norm": 1.4220308065414429, |
|
"learning_rate": 4.8e-05, |
|
"loss": 0.4294, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_LOCATION_f1": 0.39669421487603307, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.5, |
|
"eval_LOCATION_recall": 0.3287671232876712, |
|
"eval_ORGANIZATION_f1": 0.12903225806451613, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.21428571428571427, |
|
"eval_ORGANIZATION_recall": 0.09230769230769231, |
|
"eval_PERSON_f1": 0.6538461538461539, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.6296296296296297, |
|
"eval_PERSON_recall": 0.68, |
|
"eval_QUANTITY_f1": 0.13333333333333333, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.1875, |
|
"eval_QUANTITY_recall": 0.10344827586206896, |
|
"eval_TIME_f1": 0.5671641791044776, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.5757575757575758, |
|
"eval_TIME_recall": 0.5588235294117647, |
|
"eval_loss": 0.3323652446269989, |
|
"eval_overall_accuracy": 0.907703667240955, |
|
"eval_overall_f1": 0.4827586206896552, |
|
"eval_overall_precision": 0.5365853658536586, |
|
"eval_overall_recall": 0.43874643874643876, |
|
"eval_runtime": 0.374, |
|
"eval_samples_per_second": 500.058, |
|
"eval_steps_per_second": 8.022, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"grad_norm": 1.3654524087905884, |
|
"learning_rate": 4.75e-05, |
|
"loss": 0.324, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_LOCATION_f1": 0.564102564102564, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.5301204819277109, |
|
"eval_LOCATION_recall": 0.6027397260273972, |
|
"eval_ORGANIZATION_f1": 0.45255474452554745, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.4305555555555556, |
|
"eval_ORGANIZATION_recall": 0.47692307692307695, |
|
"eval_PERSON_f1": 0.8263473053892216, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.75, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.39999999999999997, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.3870967741935484, |
|
"eval_QUANTITY_recall": 0.41379310344827586, |
|
"eval_TIME_f1": 0.6849315068493151, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6410256410256411, |
|
"eval_TIME_recall": 0.7352941176470589, |
|
"eval_loss": 0.26078376173973083, |
|
"eval_overall_accuracy": 0.9308392813192222, |
|
"eval_overall_f1": 0.6578947368421052, |
|
"eval_overall_precision": 0.6112469437652812, |
|
"eval_overall_recall": 0.7122507122507122, |
|
"eval_runtime": 0.3725, |
|
"eval_samples_per_second": 502.055, |
|
"eval_steps_per_second": 8.054, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"grad_norm": 1.6405872106552124, |
|
"learning_rate": 4.7e-05, |
|
"loss": 0.2665, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_LOCATION_f1": 0.6826347305389222, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.6063829787234043, |
|
"eval_LOCATION_recall": 0.7808219178082192, |
|
"eval_ORGANIZATION_f1": 0.5394736842105263, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.47126436781609193, |
|
"eval_ORGANIZATION_recall": 0.6307692307692307, |
|
"eval_PERSON_f1": 0.8363636363636363, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7666666666666667, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.4444444444444445, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.4117647058823529, |
|
"eval_QUANTITY_recall": 0.4827586206896552, |
|
"eval_TIME_f1": 0.7027027027027027, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.65, |
|
"eval_TIME_recall": 0.7647058823529411, |
|
"eval_loss": 0.23299816250801086, |
|
"eval_overall_accuracy": 0.934531134629584, |
|
"eval_overall_f1": 0.7022900763358779, |
|
"eval_overall_precision": 0.6344827586206897, |
|
"eval_overall_recall": 0.7863247863247863, |
|
"eval_runtime": 0.3778, |
|
"eval_samples_per_second": 494.969, |
|
"eval_steps_per_second": 7.941, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"grad_norm": 1.7495594024658203, |
|
"learning_rate": 4.6500000000000005e-05, |
|
"loss": 0.2275, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_LOCATION_f1": 0.7349397590361444, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.6559139784946236, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.5660377358490566, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.4787234042553192, |
|
"eval_ORGANIZATION_recall": 0.6923076923076923, |
|
"eval_PERSON_f1": 0.8475609756097561, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7808988764044944, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.4444444444444445, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.4117647058823529, |
|
"eval_QUANTITY_recall": 0.4827586206896552, |
|
"eval_TIME_f1": 0.7027027027027027, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.65, |
|
"eval_TIME_recall": 0.7647058823529411, |
|
"eval_loss": 0.19754259288311005, |
|
"eval_overall_accuracy": 0.9392074821560423, |
|
"eval_overall_f1": 0.7215189873417722, |
|
"eval_overall_precision": 0.6492027334851936, |
|
"eval_overall_recall": 0.811965811965812, |
|
"eval_runtime": 0.382, |
|
"eval_samples_per_second": 489.509, |
|
"eval_steps_per_second": 7.853, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"grad_norm": 1.2530863285064697, |
|
"learning_rate": 4.600000000000001e-05, |
|
"loss": 0.2049, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_LOCATION_f1": 0.7283236994219653, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.63, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.5256410256410257, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.45054945054945056, |
|
"eval_ORGANIZATION_recall": 0.6307692307692307, |
|
"eval_PERSON_f1": 0.851851851851852, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7931034482758621, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.5538461538461539, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5, |
|
"eval_QUANTITY_recall": 0.6206896551724138, |
|
"eval_TIME_f1": 0.72, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6585365853658537, |
|
"eval_TIME_recall": 0.7941176470588235, |
|
"eval_loss": 0.1830800473690033, |
|
"eval_overall_accuracy": 0.9419148412503077, |
|
"eval_overall_f1": 0.7238335435056746, |
|
"eval_overall_precision": 0.6493212669683258, |
|
"eval_overall_recall": 0.8176638176638177, |
|
"eval_runtime": 0.3764, |
|
"eval_samples_per_second": 496.877, |
|
"eval_steps_per_second": 7.971, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"grad_norm": 2.133810520172119, |
|
"learning_rate": 4.55e-05, |
|
"loss": 0.1888, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_LOCATION_f1": 0.7261904761904762, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.6421052631578947, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.5822784810126582, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.4946236559139785, |
|
"eval_ORGANIZATION_recall": 0.7076923076923077, |
|
"eval_PERSON_f1": 0.8374999999999999, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.788235294117647, |
|
"eval_PERSON_recall": 0.8933333333333333, |
|
"eval_QUANTITY_f1": 0.47619047619047616, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.4411764705882353, |
|
"eval_QUANTITY_recall": 0.5172413793103449, |
|
"eval_TIME_f1": 0.7105263157894737, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6428571428571429, |
|
"eval_TIME_recall": 0.7941176470588235, |
|
"eval_loss": 0.17504610121250153, |
|
"eval_overall_accuracy": 0.9431454590204282, |
|
"eval_overall_f1": 0.7210191082802548, |
|
"eval_overall_precision": 0.652073732718894, |
|
"eval_overall_recall": 0.8062678062678063, |
|
"eval_runtime": 0.3734, |
|
"eval_samples_per_second": 500.739, |
|
"eval_steps_per_second": 8.033, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"grad_norm": 0.8962897658348083, |
|
"learning_rate": 4.5e-05, |
|
"loss": 0.1759, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_LOCATION_f1": 0.7643312101910829, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7142857142857143, |
|
"eval_LOCATION_recall": 0.821917808219178, |
|
"eval_ORGANIZATION_f1": 0.6086956521739131, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5104166666666666, |
|
"eval_ORGANIZATION_recall": 0.7538461538461538, |
|
"eval_PERSON_f1": 0.8348909657320873, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.783625730994152, |
|
"eval_PERSON_recall": 0.8933333333333333, |
|
"eval_QUANTITY_f1": 0.6060606060606061, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5405405405405406, |
|
"eval_QUANTITY_recall": 0.6896551724137931, |
|
"eval_TIME_f1": 0.7368421052631577, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6666666666666666, |
|
"eval_TIME_recall": 0.8235294117647058, |
|
"eval_loss": 0.16711482405662537, |
|
"eval_overall_accuracy": 0.9458528181146936, |
|
"eval_overall_f1": 0.7451984635083226, |
|
"eval_overall_precision": 0.6767441860465117, |
|
"eval_overall_recall": 0.8290598290598291, |
|
"eval_runtime": 0.3754, |
|
"eval_samples_per_second": 498.083, |
|
"eval_steps_per_second": 7.991, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"grad_norm": 1.1401879787445068, |
|
"learning_rate": 4.4500000000000004e-05, |
|
"loss": 0.1691, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_LOCATION_f1": 0.7738095238095238, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.6842105263157895, |
|
"eval_LOCATION_recall": 0.8904109589041096, |
|
"eval_ORGANIZATION_f1": 0.6415094339622641, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5425531914893617, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8500000000000001, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.6363636363636365, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5675675675675675, |
|
"eval_QUANTITY_recall": 0.7241379310344828, |
|
"eval_TIME_f1": 0.7894736842105262, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.16388720273971558, |
|
"eval_overall_accuracy": 0.9463450652227419, |
|
"eval_overall_f1": 0.7680608365019013, |
|
"eval_overall_precision": 0.6917808219178082, |
|
"eval_overall_recall": 0.8632478632478633, |
|
"eval_runtime": 0.3746, |
|
"eval_samples_per_second": 499.243, |
|
"eval_steps_per_second": 8.009, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"grad_norm": 1.234176754951477, |
|
"learning_rate": 4.4000000000000006e-05, |
|
"loss": 0.1569, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_LOCATION_f1": 0.7901234567901235, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7191011235955056, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.625, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5263157894736842, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8385093167701863, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7848837209302325, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.6086956521739131, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.525, |
|
"eval_QUANTITY_recall": 0.7241379310344828, |
|
"eval_TIME_f1": 0.7532467532467532, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6744186046511628, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.16664613783359528, |
|
"eval_overall_accuracy": 0.9458528181146936, |
|
"eval_overall_f1": 0.7569620253164556, |
|
"eval_overall_precision": 0.6810933940774487, |
|
"eval_overall_recall": 0.8518518518518519, |
|
"eval_runtime": 0.3735, |
|
"eval_samples_per_second": 500.672, |
|
"eval_steps_per_second": 8.032, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"grad_norm": 1.1105190515518188, |
|
"learning_rate": 4.35e-05, |
|
"loss": 0.1512, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_LOCATION_f1": 0.7749999999999999, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7126436781609196, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.6357615894039734, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5581395348837209, |
|
"eval_ORGANIZATION_recall": 0.7384615384615385, |
|
"eval_PERSON_f1": 0.84375, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7941176470588235, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.6268656716417911, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5526315789473685, |
|
"eval_QUANTITY_recall": 0.7241379310344828, |
|
"eval_TIME_f1": 0.8108108108108107, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.1505931168794632, |
|
"eval_overall_accuracy": 0.9510214127492, |
|
"eval_overall_f1": 0.766839378238342, |
|
"eval_overall_precision": 0.7030878859857482, |
|
"eval_overall_recall": 0.8433048433048433, |
|
"eval_runtime": 0.3701, |
|
"eval_samples_per_second": 505.237, |
|
"eval_steps_per_second": 8.105, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"grad_norm": 1.2889316082000732, |
|
"learning_rate": 4.3e-05, |
|
"loss": 0.1492, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_LOCATION_f1": 0.7901234567901235, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7191011235955056, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.6257668711656441, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5204081632653061, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8411214953271027, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7894736842105263, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.6865671641791046, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6052631578947368, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.7894736842105262, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.15868589282035828, |
|
"eval_overall_accuracy": 0.9483140536549348, |
|
"eval_overall_f1": 0.7680608365019013, |
|
"eval_overall_precision": 0.6917808219178082, |
|
"eval_overall_recall": 0.8632478632478633, |
|
"eval_runtime": 0.3734, |
|
"eval_samples_per_second": 500.783, |
|
"eval_steps_per_second": 8.034, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"grad_norm": 1.1166456937789917, |
|
"learning_rate": 4.25e-05, |
|
"loss": 0.1422, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_LOCATION_f1": 0.7852760736196318, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7111111111111111, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.6134969325153374, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5102040816326531, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8500000000000001, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7272727272727273, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6486486486486487, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8051948051948051, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7209302325581395, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.15712317824363708, |
|
"eval_overall_accuracy": 0.9483140536549348, |
|
"eval_overall_f1": 0.7731305449936628, |
|
"eval_overall_precision": 0.6963470319634704, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.3753, |
|
"eval_samples_per_second": 498.228, |
|
"eval_steps_per_second": 7.993, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"grad_norm": 1.7718479633331299, |
|
"learning_rate": 4.2e-05, |
|
"loss": 0.1386, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_LOCATION_f1": 0.782608695652174, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7159090909090909, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6233766233766234, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5393258426966292, |
|
"eval_ORGANIZATION_recall": 0.7384615384615385, |
|
"eval_PERSON_f1": 0.8714733542319748, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8224852071005917, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7352941176470588, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6410256410256411, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.7792207792207793, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6976744186046512, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.1536765843629837, |
|
"eval_overall_accuracy": 0.9502830420871278, |
|
"eval_overall_f1": 0.7830551989730424, |
|
"eval_overall_precision": 0.7126168224299065, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.3723, |
|
"eval_samples_per_second": 502.251, |
|
"eval_steps_per_second": 8.058, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"grad_norm": 2.4890553951263428, |
|
"learning_rate": 4.15e-05, |
|
"loss": 0.1351, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_LOCATION_f1": 0.7974683544303799, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7411764705882353, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6219512195121952, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5151515151515151, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8698412698412699, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8303030303030303, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.7894736842105262, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.15198422968387604, |
|
"eval_overall_accuracy": 0.9500369185331036, |
|
"eval_overall_f1": 0.7814910025706941, |
|
"eval_overall_precision": 0.711943793911007, |
|
"eval_overall_recall": 0.8660968660968661, |
|
"eval_runtime": 0.3738, |
|
"eval_samples_per_second": 500.243, |
|
"eval_steps_per_second": 8.025, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"grad_norm": 3.517162561416626, |
|
"learning_rate": 4.1e-05, |
|
"loss": 0.1397, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_LOCATION_f1": 0.7848101265822783, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7294117647058823, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.6, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5052631578947369, |
|
"eval_ORGANIZATION_recall": 0.7384615384615385, |
|
"eval_PERSON_f1": 0.8698412698412699, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8303030303030303, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7575757575757576, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6756756756756757, |
|
"eval_QUANTITY_recall": 0.8620689655172413, |
|
"eval_TIME_f1": 0.8157894736842106, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7380952380952381, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.1488378345966339, |
|
"eval_overall_accuracy": 0.9500369185331036, |
|
"eval_overall_f1": 0.7819354838709679, |
|
"eval_overall_precision": 0.714622641509434, |
|
"eval_overall_recall": 0.8632478632478633, |
|
"eval_runtime": 0.375, |
|
"eval_samples_per_second": 498.682, |
|
"eval_steps_per_second": 8.0, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"grad_norm": 0.9577983021736145, |
|
"learning_rate": 4.05e-05, |
|
"loss": 0.1332, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_LOCATION_f1": 0.802547770700637, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6296296296296297, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5257731958762887, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8670886075949367, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8253012048192772, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.6461538461538462, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5833333333333334, |
|
"eval_QUANTITY_recall": 0.7241379310344828, |
|
"eval_TIME_f1": 0.8266666666666665, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7560975609756098, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.14682170748710632, |
|
"eval_overall_accuracy": 0.9512675363032242, |
|
"eval_overall_f1": 0.7819354838709679, |
|
"eval_overall_precision": 0.714622641509434, |
|
"eval_overall_recall": 0.8632478632478633, |
|
"eval_runtime": 0.3719, |
|
"eval_samples_per_second": 502.788, |
|
"eval_steps_per_second": 8.066, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"grad_norm": 1.0945817232131958, |
|
"learning_rate": 4e-05, |
|
"loss": 0.1258, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_LOCATION_f1": 0.7974683544303799, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7411764705882353, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6216216216216216, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5542168674698795, |
|
"eval_ORGANIZATION_recall": 0.7076923076923077, |
|
"eval_PERSON_f1": 0.8670886075949367, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8253012048192772, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7272727272727273, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6486486486486487, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8266666666666665, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7560975609756098, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.14338740706443787, |
|
"eval_overall_accuracy": 0.9527442776273689, |
|
"eval_overall_f1": 0.7889908256880734, |
|
"eval_overall_precision": 0.7305825242718447, |
|
"eval_overall_recall": 0.8575498575498576, |
|
"eval_runtime": 0.3718, |
|
"eval_samples_per_second": 502.95, |
|
"eval_steps_per_second": 8.069, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"grad_norm": 1.6282328367233276, |
|
"learning_rate": 3.9500000000000005e-05, |
|
"loss": 0.1231, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_LOCATION_f1": 0.7848101265822783, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7294117647058823, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.625, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.569620253164557, |
|
"eval_ORGANIZATION_recall": 0.6923076923076923, |
|
"eval_PERSON_f1": 0.8643533123028392, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8203592814371258, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8266666666666665, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7560975609756098, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.1407139003276825, |
|
"eval_overall_accuracy": 0.9544671425055378, |
|
"eval_overall_f1": 0.785243741765481, |
|
"eval_overall_precision": 0.7303921568627451, |
|
"eval_overall_recall": 0.8490028490028491, |
|
"eval_runtime": 0.3796, |
|
"eval_samples_per_second": 492.652, |
|
"eval_steps_per_second": 7.904, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"grad_norm": 1.690437912940979, |
|
"learning_rate": 3.9000000000000006e-05, |
|
"loss": 0.1218, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_LOCATION_f1": 0.759493670886076, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7058823529411765, |
|
"eval_LOCATION_recall": 0.821917808219178, |
|
"eval_ORGANIZATION_f1": 0.6144578313253013, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.504950495049505, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.85625, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8058823529411765, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8533333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7804878048780488, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.14947740733623505, |
|
"eval_overall_accuracy": 0.9500369185331036, |
|
"eval_overall_f1": 0.7729591836734694, |
|
"eval_overall_precision": 0.6997690531177829, |
|
"eval_overall_recall": 0.8632478632478633, |
|
"eval_runtime": 0.3754, |
|
"eval_samples_per_second": 498.1, |
|
"eval_steps_per_second": 7.991, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"grad_norm": 1.4524682760238647, |
|
"learning_rate": 3.85e-05, |
|
"loss": 0.1189, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_LOCATION_f1": 0.8076923076923077, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7590361445783133, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6451612903225806, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5555555555555556, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8726114649681529, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8353658536585366, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.696969696969697, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6216216216216216, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8800000000000001, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.8048780487804879, |
|
"eval_TIME_recall": 0.9705882352941176, |
|
"eval_loss": 0.13879932463169098, |
|
"eval_overall_accuracy": 0.9561900073837066, |
|
"eval_overall_f1": 0.7989556135770235, |
|
"eval_overall_precision": 0.7373493975903614, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.3734, |
|
"eval_samples_per_second": 500.853, |
|
"eval_steps_per_second": 8.035, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"grad_norm": 1.4798812866210938, |
|
"learning_rate": 3.8e-05, |
|
"loss": 0.1176, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_LOCATION_f1": 0.7848101265822783, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7294117647058823, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.6459627329192547, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5416666666666666, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8643533123028392, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8203592814371258, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6153846153846154, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.7894736842105262, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.14802934229373932, |
|
"eval_overall_accuracy": 0.9522520305193207, |
|
"eval_overall_f1": 0.782051282051282, |
|
"eval_overall_precision": 0.710955710955711, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.373, |
|
"eval_samples_per_second": 501.394, |
|
"eval_steps_per_second": 8.044, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"grad_norm": 1.3379883766174316, |
|
"learning_rate": 3.7500000000000003e-05, |
|
"loss": 0.115, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_LOCATION_f1": 0.7777777777777778, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7078651685393258, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6335403726708075, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.53125, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8698412698412699, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8303030303030303, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8266666666666665, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7560975609756098, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.14569295942783356, |
|
"eval_overall_accuracy": 0.9534826482894413, |
|
"eval_overall_f1": 0.7840616966580978, |
|
"eval_overall_precision": 0.7142857142857143, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.3725, |
|
"eval_samples_per_second": 502.079, |
|
"eval_steps_per_second": 8.055, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"grad_norm": 2.1995344161987305, |
|
"learning_rate": 3.7e-05, |
|
"loss": 0.1175, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_LOCATION_f1": 0.7973856209150326, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7625, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.6308724832214766, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5595238095238095, |
|
"eval_ORGANIZATION_recall": 0.7230769230769231, |
|
"eval_PERSON_f1": 0.879746835443038, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8373493975903614, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6153846153846154, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8266666666666665, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7560975609756098, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.14247295260429382, |
|
"eval_overall_accuracy": 0.9554516367216342, |
|
"eval_overall_f1": 0.7936925098554534, |
|
"eval_overall_precision": 0.7365853658536585, |
|
"eval_overall_recall": 0.8603988603988604, |
|
"eval_runtime": 0.3735, |
|
"eval_samples_per_second": 500.637, |
|
"eval_steps_per_second": 8.032, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"grad_norm": 1.194440484046936, |
|
"learning_rate": 3.65e-05, |
|
"loss": 0.1099, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_LOCATION_f1": 0.7820512820512822, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.6883116883116883, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5955056179775281, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8825396825396825, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8424242424242424, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6666666666666666, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.575, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8311688311688312, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7441860465116279, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.14262671768665314, |
|
"eval_overall_accuracy": 0.9556977602756583, |
|
"eval_overall_f1": 0.7989623865110247, |
|
"eval_overall_precision": 0.7333333333333333, |
|
"eval_overall_recall": 0.8774928774928775, |
|
"eval_runtime": 0.3711, |
|
"eval_samples_per_second": 503.938, |
|
"eval_steps_per_second": 8.085, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"grad_norm": 1.36868155002594, |
|
"learning_rate": 3.6e-05, |
|
"loss": 0.1108, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_LOCATION_f1": 0.7999999999999999, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.6842105263157896, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5977011494252874, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8706624605678233, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8263473053892215, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5945945945945946, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8266666666666665, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7560975609756098, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.1398727297782898, |
|
"eval_overall_accuracy": 0.9554516367216342, |
|
"eval_overall_f1": 0.7973856209150327, |
|
"eval_overall_precision": 0.7367149758454107, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.3749, |
|
"eval_samples_per_second": 498.749, |
|
"eval_steps_per_second": 8.001, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"grad_norm": 0.8069501519203186, |
|
"learning_rate": 3.55e-05, |
|
"loss": 0.1071, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_LOCATION_f1": 0.782608695652174, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7159090909090909, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6506024096385542, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5346534653465347, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.877742946708464, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8284023668639053, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.716417910447761, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.631578947368421, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7619047619047619, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.14704711735248566, |
|
"eval_overall_accuracy": 0.9512675363032242, |
|
"eval_overall_f1": 0.7934093789607097, |
|
"eval_overall_precision": 0.7146118721461188, |
|
"eval_overall_recall": 0.8917378917378918, |
|
"eval_runtime": 0.3733, |
|
"eval_samples_per_second": 500.911, |
|
"eval_steps_per_second": 8.036, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"grad_norm": 1.9499945640563965, |
|
"learning_rate": 3.5e-05, |
|
"loss": 0.1075, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_LOCATION_f1": 0.7999999999999999, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.6714285714285715, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6266666666666667, |
|
"eval_ORGANIZATION_recall": 0.7230769230769231, |
|
"eval_PERSON_f1": 0.8616352201257862, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8154761904761905, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.6461538461538462, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5833333333333334, |
|
"eval_QUANTITY_recall": 0.7241379310344828, |
|
"eval_TIME_f1": 0.9041095890410958, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.8461538461538461, |
|
"eval_TIME_recall": 0.9705882352941176, |
|
"eval_loss": 0.13154004514217377, |
|
"eval_overall_accuracy": 0.956928378045779, |
|
"eval_overall_f1": 0.7989347536617842, |
|
"eval_overall_precision": 0.75, |
|
"eval_overall_recall": 0.8547008547008547, |
|
"eval_runtime": 0.3718, |
|
"eval_samples_per_second": 502.965, |
|
"eval_steps_per_second": 8.069, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"grad_norm": 0.5096124410629272, |
|
"learning_rate": 3.45e-05, |
|
"loss": 0.1053, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_LOCATION_f1": 0.8051948051948052, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7654320987654321, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.6753246753246754, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5842696629213483, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.879746835443038, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8373493975903614, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676470588235294, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5897435897435898, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8266666666666665, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7560975609756098, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.1396467238664627, |
|
"eval_overall_accuracy": 0.9554516367216342, |
|
"eval_overall_f1": 0.8005215123859191, |
|
"eval_overall_precision": 0.7379807692307693, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.373, |
|
"eval_samples_per_second": 501.294, |
|
"eval_steps_per_second": 8.042, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"grad_norm": 0.622959554195404, |
|
"learning_rate": 3.4000000000000007e-05, |
|
"loss": 0.1027, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_LOCATION_f1": 0.8129032258064516, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7682926829268293, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6748466257668712, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5612244897959183, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.879746835443038, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8373493975903614, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.696969696969697, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6216216216216216, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8533333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7804878048780488, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.14285185933113098, |
|
"eval_overall_accuracy": 0.9549593896135861, |
|
"eval_overall_f1": 0.8051612903225805, |
|
"eval_overall_precision": 0.7358490566037735, |
|
"eval_overall_recall": 0.8888888888888888, |
|
"eval_runtime": 0.371, |
|
"eval_samples_per_second": 504.003, |
|
"eval_steps_per_second": 8.086, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"grad_norm": 1.2904415130615234, |
|
"learning_rate": 3.35e-05, |
|
"loss": 0.1036, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_LOCATION_f1": 0.8051948051948052, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7654320987654321, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.6878980891719746, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5869565217391305, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8734177215189873, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8313253012048193, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.716417910447761, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.631578947368421, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.1392923891544342, |
|
"eval_overall_accuracy": 0.9559438838296825, |
|
"eval_overall_f1": 0.8046875000000001, |
|
"eval_overall_precision": 0.7410071942446043, |
|
"eval_overall_recall": 0.8803418803418803, |
|
"eval_runtime": 0.3722, |
|
"eval_samples_per_second": 502.408, |
|
"eval_steps_per_second": 8.06, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"grad_norm": 3.785581350326538, |
|
"learning_rate": 3.3e-05, |
|
"loss": 0.1, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_LOCATION_f1": 0.7999999999999999, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.6838709677419356, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5888888888888889, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8734177215189873, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8313253012048193, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6865671641791046, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6052631578947368, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8533333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7804878048780488, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.13862958550453186, |
|
"eval_overall_accuracy": 0.9561900073837066, |
|
"eval_overall_f1": 0.8020833333333333, |
|
"eval_overall_precision": 0.7386091127098321, |
|
"eval_overall_recall": 0.8774928774928775, |
|
"eval_runtime": 0.3727, |
|
"eval_samples_per_second": 501.785, |
|
"eval_steps_per_second": 8.05, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"grad_norm": 0.7286350131034851, |
|
"learning_rate": 3.2500000000000004e-05, |
|
"loss": 0.1013, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_LOCATION_f1": 0.7948717948717949, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7469879518072289, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.6875, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5789473684210527, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8734177215189873, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8313253012048193, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6956521739130435, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8266666666666665, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7560975609756098, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.1437290757894516, |
|
"eval_overall_accuracy": 0.9549593896135861, |
|
"eval_overall_f1": 0.7989690721649485, |
|
"eval_overall_precision": 0.7294117647058823, |
|
"eval_overall_recall": 0.8831908831908832, |
|
"eval_runtime": 0.3727, |
|
"eval_samples_per_second": 501.777, |
|
"eval_steps_per_second": 8.05, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"grad_norm": 0.8509505391120911, |
|
"learning_rate": 3.2000000000000005e-05, |
|
"loss": 0.0988, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_LOCATION_f1": 0.7870967741935484, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.6794871794871795, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5824175824175825, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8761904761904761, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8363636363636363, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.676470588235294, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5897435897435898, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8266666666666665, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7560975609756098, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.14367760717868805, |
|
"eval_overall_accuracy": 0.9547132660595619, |
|
"eval_overall_f1": 0.7958387516254878, |
|
"eval_overall_precision": 0.7320574162679426, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.3724, |
|
"eval_samples_per_second": 502.107, |
|
"eval_steps_per_second": 8.055, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"grad_norm": 1.2342133522033691, |
|
"learning_rate": 3.15e-05, |
|
"loss": 0.0971, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"eval_LOCATION_f1": 0.7770700636942677, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.6705882352941177, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5428571428571428, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8706624605678233, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8263473053892215, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.676470588235294, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5897435897435898, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7317073170731707, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.1551184207201004, |
|
"eval_overall_accuracy": 0.9490524243170071, |
|
"eval_overall_f1": 0.7852604828462516, |
|
"eval_overall_precision": 0.7087155963302753, |
|
"eval_overall_recall": 0.8803418803418803, |
|
"eval_runtime": 0.3737, |
|
"eval_samples_per_second": 500.4, |
|
"eval_steps_per_second": 8.028, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"grad_norm": 1.0431395769119263, |
|
"learning_rate": 3.1e-05, |
|
"loss": 0.0967, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_LOCATION_f1": 0.7973856209150326, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7625, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.6805555555555556, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.620253164556962, |
|
"eval_ORGANIZATION_recall": 0.7538461538461538, |
|
"eval_PERSON_f1": 0.8761904761904761, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8363636363636363, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6865671641791046, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6052631578947368, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.13686208426952362, |
|
"eval_overall_accuracy": 0.956928378045779, |
|
"eval_overall_f1": 0.802124833997344, |
|
"eval_overall_precision": 0.7512437810945274, |
|
"eval_overall_recall": 0.8603988603988604, |
|
"eval_runtime": 0.3727, |
|
"eval_samples_per_second": 501.728, |
|
"eval_steps_per_second": 8.049, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"grad_norm": 1.3837076425552368, |
|
"learning_rate": 3.05e-05, |
|
"loss": 0.0949, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"eval_LOCATION_f1": 0.7898089171974523, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.6832298136645962, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5729166666666666, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8761904761904761, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8363636363636363, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5945945945945946, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8266666666666665, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7560975609756098, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.13983625173568726, |
|
"eval_overall_accuracy": 0.9559438838296825, |
|
"eval_overall_f1": 0.7958656330749354, |
|
"eval_overall_precision": 0.7281323877068558, |
|
"eval_overall_recall": 0.8774928774928775, |
|
"eval_runtime": 0.3721, |
|
"eval_samples_per_second": 502.567, |
|
"eval_steps_per_second": 8.063, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"grad_norm": 0.6632676124572754, |
|
"learning_rate": 3e-05, |
|
"loss": 0.0956, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_LOCATION_f1": 0.7770700636942677, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.6973684210526315, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6091954022988506, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8789808917197452, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.676470588235294, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5897435897435898, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.14134033024311066, |
|
"eval_overall_accuracy": 0.9559438838296825, |
|
"eval_overall_f1": 0.7999999999999999, |
|
"eval_overall_precision": 0.7391304347826086, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.3777, |
|
"eval_samples_per_second": 495.154, |
|
"eval_steps_per_second": 7.944, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"grad_norm": 0.36149993538856506, |
|
"learning_rate": 2.95e-05, |
|
"loss": 0.0913, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"eval_LOCATION_f1": 0.7898089171974523, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.7051282051282052, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6043956043956044, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8789808917197452, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6865671641791046, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6052631578947368, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8266666666666665, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7560975609756098, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.13970939815044403, |
|
"eval_overall_accuracy": 0.9566822544917548, |
|
"eval_overall_f1": 0.8036410923276982, |
|
"eval_overall_precision": 0.7392344497607656, |
|
"eval_overall_recall": 0.8803418803418803, |
|
"eval_runtime": 0.3722, |
|
"eval_samples_per_second": 502.411, |
|
"eval_steps_per_second": 8.06, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"grad_norm": 0.5602841377258301, |
|
"learning_rate": 2.9e-05, |
|
"loss": 0.0949, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_LOCATION_f1": 0.7870967741935484, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.6923076923076923, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5934065934065934, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.676470588235294, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5897435897435898, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.1462649405002594, |
|
"eval_overall_accuracy": 0.9547132660595619, |
|
"eval_overall_f1": 0.8026143790849672, |
|
"eval_overall_precision": 0.7415458937198067, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3742, |
|
"eval_samples_per_second": 499.754, |
|
"eval_steps_per_second": 8.017, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"grad_norm": 0.9771382808685303, |
|
"learning_rate": 2.8499999999999998e-05, |
|
"loss": 0.0919, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"eval_LOCATION_f1": 0.7820512820512822, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.684931506849315, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6172839506172839, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8789808917197452, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5945945945945946, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8266666666666665, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7560975609756098, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.1370939314365387, |
|
"eval_overall_accuracy": 0.9566822544917548, |
|
"eval_overall_f1": 0.7978863936591809, |
|
"eval_overall_precision": 0.7438423645320197, |
|
"eval_overall_recall": 0.8603988603988604, |
|
"eval_runtime": 0.3709, |
|
"eval_samples_per_second": 504.137, |
|
"eval_steps_per_second": 8.088, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"grad_norm": 3.2234935760498047, |
|
"learning_rate": 2.8000000000000003e-05, |
|
"loss": 0.0895, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_LOCATION_f1": 0.7999999999999999, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.6758620689655173, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6125, |
|
"eval_ORGANIZATION_recall": 0.7538461538461538, |
|
"eval_PERSON_f1": 0.8825396825396825, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8424242424242424, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6865671641791046, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6052631578947368, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8648648648648648, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.1338210105895996, |
|
"eval_overall_accuracy": 0.9576667487078513, |
|
"eval_overall_f1": 0.8068783068783069, |
|
"eval_overall_precision": 0.7530864197530864, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.3714, |
|
"eval_samples_per_second": 503.565, |
|
"eval_steps_per_second": 8.079, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"grad_norm": 3.458214282989502, |
|
"learning_rate": 2.7500000000000004e-05, |
|
"loss": 0.0899, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"eval_LOCATION_f1": 0.7792207792207793, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7407407407407407, |
|
"eval_LOCATION_recall": 0.821917808219178, |
|
"eval_ORGANIZATION_f1": 0.6835443037974683, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5806451612903226, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8789808917197452, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5945945945945946, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8533333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7804878048780488, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.14024274051189423, |
|
"eval_overall_accuracy": 0.956928378045779, |
|
"eval_overall_f1": 0.7979139504563233, |
|
"eval_overall_precision": 0.7355769230769231, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.4103, |
|
"eval_samples_per_second": 455.728, |
|
"eval_steps_per_second": 7.311, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"grad_norm": 1.2206172943115234, |
|
"learning_rate": 2.7000000000000002e-05, |
|
"loss": 0.088, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_LOCATION_f1": 0.7922077922077922, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7019867549668873, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6162790697674418, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6461538461538462, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5833333333333334, |
|
"eval_QUANTITY_recall": 0.7241379310344828, |
|
"eval_TIME_f1": 0.8648648648648648, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.1336318403482437, |
|
"eval_overall_accuracy": 0.9584051193699237, |
|
"eval_overall_f1": 0.8068783068783069, |
|
"eval_overall_precision": 0.7530864197530864, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.3724, |
|
"eval_samples_per_second": 502.143, |
|
"eval_steps_per_second": 8.056, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"grad_norm": 1.561812162399292, |
|
"learning_rate": 2.6500000000000004e-05, |
|
"loss": 0.0896, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"eval_LOCATION_f1": 0.7770700636942677, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5894736842105263, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8853503184713376, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8475609756097561, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7619047619047619, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.14269451797008514, |
|
"eval_overall_accuracy": 0.9561900073837066, |
|
"eval_overall_f1": 0.805699481865285, |
|
"eval_overall_precision": 0.7387173396674585, |
|
"eval_overall_recall": 0.886039886039886, |
|
"eval_runtime": 0.3722, |
|
"eval_samples_per_second": 502.433, |
|
"eval_steps_per_second": 8.06, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"grad_norm": 3.845472812652588, |
|
"learning_rate": 2.6000000000000002e-05, |
|
"loss": 0.0897, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_LOCATION_f1": 0.7672955974842768, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7093023255813954, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7019867549668873, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6162790697674418, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8825396825396825, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8424242424242424, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676470588235294, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5897435897435898, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8157894736842106, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7380952380952381, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.1460731029510498, |
|
"eval_overall_accuracy": 0.9549593896135861, |
|
"eval_overall_f1": 0.7984395318595578, |
|
"eval_overall_precision": 0.7344497607655502, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3721, |
|
"eval_samples_per_second": 502.528, |
|
"eval_steps_per_second": 8.062, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"grad_norm": 0.42411187291145325, |
|
"learning_rate": 2.5500000000000003e-05, |
|
"loss": 0.0836, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"eval_LOCATION_f1": 0.7770700636942677, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.6838709677419356, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5888888888888889, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.696969696969697, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6216216216216216, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7317073170731707, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.14366112649440765, |
|
"eval_overall_accuracy": 0.9552055131676102, |
|
"eval_overall_f1": 0.7973856209150327, |
|
"eval_overall_precision": 0.7367149758454107, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.3738, |
|
"eval_samples_per_second": 500.237, |
|
"eval_steps_per_second": 8.025, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"grad_norm": 1.5665122270584106, |
|
"learning_rate": 2.5e-05, |
|
"loss": 0.0845, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_LOCATION_f1": 0.7770700636942677, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7051282051282052, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6043956043956044, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5945945945945946, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.14279314875602722, |
|
"eval_overall_accuracy": 0.9552055131676102, |
|
"eval_overall_f1": 0.8015665796344648, |
|
"eval_overall_precision": 0.7397590361445783, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3776, |
|
"eval_samples_per_second": 495.202, |
|
"eval_steps_per_second": 7.944, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"grad_norm": 0.8180804252624512, |
|
"learning_rate": 2.45e-05, |
|
"loss": 0.0849, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"eval_LOCATION_f1": 0.7870967741935484, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.6973684210526315, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6091954022988506, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5945945945945946, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.1387655884027481, |
|
"eval_overall_accuracy": 0.9564361309377307, |
|
"eval_overall_f1": 0.8026315789473685, |
|
"eval_overall_precision": 0.7457212713936431, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.377, |
|
"eval_samples_per_second": 496.079, |
|
"eval_steps_per_second": 7.958, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"grad_norm": 2.047976016998291, |
|
"learning_rate": 2.4e-05, |
|
"loss": 0.0836, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"eval_LOCATION_f1": 0.7672955974842768, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7093023255813954, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7019867549668873, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6162790697674418, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6865671641791046, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6052631578947368, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8266666666666665, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7560975609756098, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.14351429045200348, |
|
"eval_overall_accuracy": 0.9554516367216342, |
|
"eval_overall_f1": 0.8010471204188482, |
|
"eval_overall_precision": 0.7409200968523002, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.3744, |
|
"eval_samples_per_second": 499.405, |
|
"eval_steps_per_second": 8.012, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"grad_norm": 1.9604336023330688, |
|
"learning_rate": 2.35e-05, |
|
"loss": 0.0838, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"eval_LOCATION_f1": 0.7625000000000001, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7011494252873564, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.6835443037974683, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5806451612903226, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8789808917197452, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6666666666666666, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.575, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7317073170731707, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.14942599833011627, |
|
"eval_overall_accuracy": 0.9527442776273689, |
|
"eval_overall_f1": 0.788659793814433, |
|
"eval_overall_precision": 0.72, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.3783, |
|
"eval_samples_per_second": 494.359, |
|
"eval_steps_per_second": 7.931, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"grad_norm": 1.6018130779266357, |
|
"learning_rate": 2.3000000000000003e-05, |
|
"loss": 0.0811, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"eval_LOCATION_f1": 0.7654320987654321, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.6966292134831461, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.6962025316455697, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5913978494623656, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7272727272727273, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6486486486486487, |
|
"eval_QUANTITY_recall": 0.8275862068965517, |
|
"eval_TIME_f1": 0.8266666666666665, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7560975609756098, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.14617691934108734, |
|
"eval_overall_accuracy": 0.9556977602756583, |
|
"eval_overall_f1": 0.8010335917312662, |
|
"eval_overall_precision": 0.7328605200945626, |
|
"eval_overall_recall": 0.8831908831908832, |
|
"eval_runtime": 0.3727, |
|
"eval_samples_per_second": 501.802, |
|
"eval_steps_per_second": 8.05, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"grad_norm": 1.0216081142425537, |
|
"learning_rate": 2.25e-05, |
|
"loss": 0.0826, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"eval_LOCATION_f1": 0.7770700636942677, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.6666666666666666, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5714285714285714, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6865671641791046, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6052631578947368, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8266666666666665, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7560975609756098, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.14629320800304413, |
|
"eval_overall_accuracy": 0.9534826482894413, |
|
"eval_overall_f1": 0.7942708333333333, |
|
"eval_overall_precision": 0.7314148681055156, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.373, |
|
"eval_samples_per_second": 501.397, |
|
"eval_steps_per_second": 8.044, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"grad_norm": 1.5277239084243774, |
|
"learning_rate": 2.2000000000000003e-05, |
|
"loss": 0.0818, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_LOCATION_f1": 0.7898089171974523, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.6794871794871795, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5824175824175825, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8789808917197452, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.696969696969697, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6216216216216216, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.14746278524398804, |
|
"eval_overall_accuracy": 0.9554516367216342, |
|
"eval_overall_f1": 0.8005215123859191, |
|
"eval_overall_precision": 0.7379807692307693, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3747, |
|
"eval_samples_per_second": 499.009, |
|
"eval_steps_per_second": 8.005, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"grad_norm": 1.1813913583755493, |
|
"learning_rate": 2.15e-05, |
|
"loss": 0.0833, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"eval_LOCATION_f1": 0.7692307692307693, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7228915662650602, |
|
"eval_LOCATION_recall": 0.821917808219178, |
|
"eval_ORGANIZATION_f1": 0.6792452830188681, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.574468085106383, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8734177215189873, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8313253012048193, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6865671641791046, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6052631578947368, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8266666666666665, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7560975609756098, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.1485372930765152, |
|
"eval_overall_accuracy": 0.9529904011813931, |
|
"eval_overall_f1": 0.7917205692108668, |
|
"eval_overall_precision": 0.7251184834123223, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.3727, |
|
"eval_samples_per_second": 501.711, |
|
"eval_steps_per_second": 8.049, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"grad_norm": 0.640755295753479, |
|
"learning_rate": 2.1e-05, |
|
"loss": 0.0798, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"eval_LOCATION_f1": 0.7692307692307693, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7228915662650602, |
|
"eval_LOCATION_recall": 0.821917808219178, |
|
"eval_ORGANIZATION_f1": 0.697986577181208, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6190476190476191, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.71875, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6571428571428571, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.14086660742759705, |
|
"eval_overall_accuracy": 0.9564361309377307, |
|
"eval_overall_f1": 0.8063660477453581, |
|
"eval_overall_precision": 0.7543424317617866, |
|
"eval_overall_recall": 0.8660968660968661, |
|
"eval_runtime": 0.3766, |
|
"eval_samples_per_second": 496.571, |
|
"eval_steps_per_second": 7.966, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"grad_norm": 2.363363265991211, |
|
"learning_rate": 2.05e-05, |
|
"loss": 0.0802, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"eval_LOCATION_f1": 0.7770700636942677, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.6883116883116883, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5955056179775281, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8266666666666665, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7560975609756098, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.14503292739391327, |
|
"eval_overall_accuracy": 0.9556977602756583, |
|
"eval_overall_f1": 0.8031496062992126, |
|
"eval_overall_precision": 0.7445255474452555, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.374, |
|
"eval_samples_per_second": 499.944, |
|
"eval_steps_per_second": 8.02, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"grad_norm": 1.6086369752883911, |
|
"learning_rate": 2e-05, |
|
"loss": 0.08, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_LOCATION_f1": 0.7999999999999999, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.7019867549668873, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6162790697674418, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6875, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6285714285714286, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8533333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7804878048780488, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.1365276426076889, |
|
"eval_overall_accuracy": 0.9591434900319961, |
|
"eval_overall_f1": 0.8121693121693121, |
|
"eval_overall_precision": 0.7580246913580246, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3728, |
|
"eval_samples_per_second": 501.578, |
|
"eval_steps_per_second": 8.047, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"grad_norm": 1.1481249332427979, |
|
"learning_rate": 1.9500000000000003e-05, |
|
"loss": 0.0792, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"eval_LOCATION_f1": 0.7692307692307693, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7228915662650602, |
|
"eval_LOCATION_recall": 0.821917808219178, |
|
"eval_ORGANIZATION_f1": 0.7152317880794703, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.627906976744186, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6875, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6285714285714286, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8533333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7804878048780488, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.13838407397270203, |
|
"eval_overall_accuracy": 0.9576667487078513, |
|
"eval_overall_f1": 0.8073878627968336, |
|
"eval_overall_precision": 0.7518427518427518, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.3773, |
|
"eval_samples_per_second": 495.651, |
|
"eval_steps_per_second": 7.952, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"grad_norm": 1.3433496952056885, |
|
"learning_rate": 1.9e-05, |
|
"loss": 0.0776, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"eval_LOCATION_f1": 0.7692307692307693, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7228915662650602, |
|
"eval_LOCATION_recall": 0.821917808219178, |
|
"eval_ORGANIZATION_f1": 0.7222222222222222, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6582278481012658, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.696969696969697, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6216216216216216, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7619047619047619, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.14121700823307037, |
|
"eval_overall_accuracy": 0.9576667487078513, |
|
"eval_overall_f1": 0.8090185676392573, |
|
"eval_overall_precision": 0.7568238213399504, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.3749, |
|
"eval_samples_per_second": 498.784, |
|
"eval_steps_per_second": 8.002, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"grad_norm": 2.4079196453094482, |
|
"learning_rate": 1.85e-05, |
|
"loss": 0.0782, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"eval_LOCATION_f1": 0.7770700636942677, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.6878980891719746, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5869565217391305, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7619047619047619, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.1416482925415039, |
|
"eval_overall_accuracy": 0.9554516367216342, |
|
"eval_overall_f1": 0.804177545691906, |
|
"eval_overall_precision": 0.7421686746987952, |
|
"eval_overall_recall": 0.8774928774928775, |
|
"eval_runtime": 0.3756, |
|
"eval_samples_per_second": 497.871, |
|
"eval_steps_per_second": 7.987, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"grad_norm": 0.9945477247238159, |
|
"learning_rate": 1.8e-05, |
|
"loss": 0.0789, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"eval_LOCATION_f1": 0.7770700636942677, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7123287671232877, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6419753086419753, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6875, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6285714285714286, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7619047619047619, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.13378003239631653, |
|
"eval_overall_accuracy": 0.9581589958158996, |
|
"eval_overall_f1": 0.8090185676392573, |
|
"eval_overall_precision": 0.7568238213399504, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.3716, |
|
"eval_samples_per_second": 503.164, |
|
"eval_steps_per_second": 8.072, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"grad_norm": 1.0777437686920166, |
|
"learning_rate": 1.75e-05, |
|
"loss": 0.0769, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"eval_LOCATION_f1": 0.7721518987341772, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7176470588235294, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7123287671232877, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6419753086419753, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8266666666666665, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7560975609756098, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.13960254192352295, |
|
"eval_overall_accuracy": 0.9579128722618755, |
|
"eval_overall_f1": 0.8079470198675496, |
|
"eval_overall_precision": 0.754950495049505, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.3755, |
|
"eval_samples_per_second": 497.937, |
|
"eval_steps_per_second": 7.988, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"grad_norm": 0.8647677302360535, |
|
"learning_rate": 1.7000000000000003e-05, |
|
"loss": 0.0757, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"eval_LOCATION_f1": 0.7770700636942677, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7019867549668873, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6162790697674418, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7619047619047619, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.1402267962694168, |
|
"eval_overall_accuracy": 0.9576667487078513, |
|
"eval_overall_f1": 0.8042049934296978, |
|
"eval_overall_precision": 0.7463414634146341, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.3717, |
|
"eval_samples_per_second": 503.11, |
|
"eval_steps_per_second": 8.071, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"grad_norm": 1.0575724840164185, |
|
"learning_rate": 1.65e-05, |
|
"loss": 0.0753, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"eval_LOCATION_f1": 0.7820512820512822, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7210884353741497, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6463414634146342, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8533333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7804878048780488, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.13897380232810974, |
|
"eval_overall_accuracy": 0.9593896135860202, |
|
"eval_overall_f1": 0.8143236074270558, |
|
"eval_overall_precision": 0.7617866004962779, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3722, |
|
"eval_samples_per_second": 502.482, |
|
"eval_steps_per_second": 8.061, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"grad_norm": 0.9653581976890564, |
|
"learning_rate": 1.6000000000000003e-05, |
|
"loss": 0.0757, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"eval_LOCATION_f1": 0.7870967741935484, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7172413793103448, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.65, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8533333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7804878048780488, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.13793830573558807, |
|
"eval_overall_accuracy": 0.9591434900319961, |
|
"eval_overall_f1": 0.8149134487350199, |
|
"eval_overall_precision": 0.765, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.3738, |
|
"eval_samples_per_second": 500.215, |
|
"eval_steps_per_second": 8.025, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"grad_norm": 1.3589030504226685, |
|
"learning_rate": 1.55e-05, |
|
"loss": 0.0731, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"eval_LOCATION_f1": 0.7770700636942677, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7320261437908497, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6363636363636364, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.71875, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6571428571428571, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8533333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7804878048780488, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.14166338741779327, |
|
"eval_overall_accuracy": 0.9581589958158996, |
|
"eval_overall_f1": 0.8157894736842105, |
|
"eval_overall_precision": 0.7579462102689487, |
|
"eval_overall_recall": 0.8831908831908832, |
|
"eval_runtime": 0.3735, |
|
"eval_samples_per_second": 500.684, |
|
"eval_steps_per_second": 8.032, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"grad_norm": 1.4494452476501465, |
|
"learning_rate": 1.5e-05, |
|
"loss": 0.0751, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"eval_LOCATION_f1": 0.7870967741935484, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7172413793103448, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.65, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6875, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6285714285714286, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8533333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7804878048780488, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.13516362011432648, |
|
"eval_overall_accuracy": 0.9591434900319961, |
|
"eval_overall_f1": 0.814419225634179, |
|
"eval_overall_precision": 0.7663316582914573, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.3728, |
|
"eval_samples_per_second": 501.549, |
|
"eval_steps_per_second": 8.046, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"grad_norm": 2.012171745300293, |
|
"learning_rate": 1.45e-05, |
|
"loss": 0.0755, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"eval_LOCATION_f1": 0.7820512820512822, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7189542483660131, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.625, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.696969696969697, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6216216216216216, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7619047619047619, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.14387430250644684, |
|
"eval_overall_accuracy": 0.9576667487078513, |
|
"eval_overall_f1": 0.8099606815203145, |
|
"eval_overall_precision": 0.75, |
|
"eval_overall_recall": 0.8803418803418803, |
|
"eval_runtime": 0.3724, |
|
"eval_samples_per_second": 502.104, |
|
"eval_steps_per_second": 8.055, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"grad_norm": 1.370118498802185, |
|
"learning_rate": 1.4000000000000001e-05, |
|
"loss": 0.0745, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"eval_LOCATION_f1": 0.7770700636942677, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7123287671232877, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6419753086419753, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7619047619047619, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.13974949717521667, |
|
"eval_overall_accuracy": 0.9579128722618755, |
|
"eval_overall_f1": 0.8068783068783069, |
|
"eval_overall_precision": 0.7530864197530864, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.3737, |
|
"eval_samples_per_second": 500.351, |
|
"eval_steps_per_second": 8.027, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"grad_norm": 0.621573805809021, |
|
"learning_rate": 1.3500000000000001e-05, |
|
"loss": 0.0746, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"eval_LOCATION_f1": 0.7792207792207793, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7407407407407407, |
|
"eval_LOCATION_recall": 0.821917808219178, |
|
"eval_ORGANIZATION_f1": 0.7172413793103448, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.65, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8533333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7804878048780488, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.1360926479101181, |
|
"eval_overall_accuracy": 0.9591434900319961, |
|
"eval_overall_f1": 0.8133333333333332, |
|
"eval_overall_precision": 0.7644110275689223, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.3745, |
|
"eval_samples_per_second": 499.381, |
|
"eval_steps_per_second": 8.011, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"grad_norm": 1.1147890090942383, |
|
"learning_rate": 1.3000000000000001e-05, |
|
"loss": 0.0727, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"eval_LOCATION_f1": 0.7870967741935484, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7172413793103448, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.65, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6875, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6285714285714286, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8533333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7804878048780488, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.13560639321804047, |
|
"eval_overall_accuracy": 0.9596357371400444, |
|
"eval_overall_f1": 0.8133333333333332, |
|
"eval_overall_precision": 0.7644110275689223, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.374, |
|
"eval_samples_per_second": 500.038, |
|
"eval_steps_per_second": 8.022, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"grad_norm": 0.9206987619400024, |
|
"learning_rate": 1.25e-05, |
|
"loss": 0.0727, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"eval_LOCATION_f1": 0.7770700636942677, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7162162162162162, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6385542168674698, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7619047619047619, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.14432945847511292, |
|
"eval_overall_accuracy": 0.9574206251538272, |
|
"eval_overall_f1": 0.8110964332892999, |
|
"eval_overall_precision": 0.7561576354679803, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.374, |
|
"eval_samples_per_second": 499.951, |
|
"eval_steps_per_second": 8.021, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"grad_norm": 1.3934582471847534, |
|
"learning_rate": 1.2e-05, |
|
"loss": 0.073, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"eval_LOCATION_f1": 0.7770700636942677, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7012987012987013, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6067415730337079, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6875, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6285714285714286, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7317073170731707, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.14394371211528778, |
|
"eval_overall_accuracy": 0.9549593896135861, |
|
"eval_overall_f1": 0.8015768725361366, |
|
"eval_overall_precision": 0.7439024390243902, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.3764, |
|
"eval_samples_per_second": 496.875, |
|
"eval_steps_per_second": 7.971, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"grad_norm": 1.3345227241516113, |
|
"learning_rate": 1.1500000000000002e-05, |
|
"loss": 0.0733, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"eval_LOCATION_f1": 0.7792207792207793, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7407407407407407, |
|
"eval_LOCATION_recall": 0.821917808219178, |
|
"eval_ORGANIZATION_f1": 0.7310344827586207, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6625, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6875, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6285714285714286, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8266666666666665, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7560975609756098, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.13728104531764984, |
|
"eval_overall_accuracy": 0.9593896135860202, |
|
"eval_overall_f1": 0.8117489986648865, |
|
"eval_overall_precision": 0.7638190954773869, |
|
"eval_overall_recall": 0.8660968660968661, |
|
"eval_runtime": 0.3706, |
|
"eval_samples_per_second": 504.552, |
|
"eval_steps_per_second": 8.094, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"grad_norm": 1.4736689329147339, |
|
"learning_rate": 1.1000000000000001e-05, |
|
"loss": 0.072, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"eval_LOCATION_f1": 0.7870967741935484, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.726027397260274, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.654320987654321, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7619047619047619, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.14146719872951508, |
|
"eval_overall_accuracy": 0.9581589958158996, |
|
"eval_overall_f1": 0.8154050464807436, |
|
"eval_overall_precision": 0.763681592039801, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3724, |
|
"eval_samples_per_second": 502.127, |
|
"eval_steps_per_second": 8.056, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"grad_norm": 0.9665191769599915, |
|
"learning_rate": 1.05e-05, |
|
"loss": 0.0718, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"eval_LOCATION_f1": 0.7721518987341772, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7176470588235294, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.717948717948718, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6153846153846154, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7317073170731707, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.14953278005123138, |
|
"eval_overall_accuracy": 0.9552055131676102, |
|
"eval_overall_f1": 0.8031290743155151, |
|
"eval_overall_precision": 0.7403846153846154, |
|
"eval_overall_recall": 0.8774928774928775, |
|
"eval_runtime": 0.3713, |
|
"eval_samples_per_second": 503.668, |
|
"eval_steps_per_second": 8.08, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"grad_norm": 0.4756767153739929, |
|
"learning_rate": 1e-05, |
|
"loss": 0.0703, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_LOCATION_f1": 0.7820512820512822, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7432432432432433, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6626506024096386, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7317073170731707, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.14299984276294708, |
|
"eval_overall_accuracy": 0.9571745015998031, |
|
"eval_overall_f1": 0.8110964332892999, |
|
"eval_overall_precision": 0.7561576354679803, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3781, |
|
"eval_samples_per_second": 494.608, |
|
"eval_steps_per_second": 7.935, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"grad_norm": 0.7018587589263916, |
|
"learning_rate": 9.5e-06, |
|
"loss": 0.0702, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"eval_LOCATION_f1": 0.7820512820512822, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7432432432432433, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6626506024096386, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.71875, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6571428571428571, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7317073170731707, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.14150598645210266, |
|
"eval_overall_accuracy": 0.9584051193699237, |
|
"eval_overall_f1": 0.8143236074270558, |
|
"eval_overall_precision": 0.7617866004962779, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3737, |
|
"eval_samples_per_second": 500.383, |
|
"eval_steps_per_second": 8.028, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"grad_norm": 1.6355091333389282, |
|
"learning_rate": 9e-06, |
|
"loss": 0.0721, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"eval_LOCATION_f1": 0.7820512820512822, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7432432432432433, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6626506024096386, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.71875, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6571428571428571, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8266666666666665, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7560975609756098, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.14245130121707916, |
|
"eval_overall_accuracy": 0.958897366477972, |
|
"eval_overall_f1": 0.8169761273209548, |
|
"eval_overall_precision": 0.7642679900744417, |
|
"eval_overall_recall": 0.8774928774928775, |
|
"eval_runtime": 0.3741, |
|
"eval_samples_per_second": 499.836, |
|
"eval_steps_per_second": 8.019, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"grad_norm": 0.8933713436126709, |
|
"learning_rate": 8.500000000000002e-06, |
|
"loss": 0.0712, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"eval_LOCATION_f1": 0.7770700636942677, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7432432432432433, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6626506024096386, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.71875, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6571428571428571, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7619047619047619, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.1438244879245758, |
|
"eval_overall_accuracy": 0.9586512429239479, |
|
"eval_overall_f1": 0.8174603174603174, |
|
"eval_overall_precision": 0.762962962962963, |
|
"eval_overall_recall": 0.8803418803418803, |
|
"eval_runtime": 0.3755, |
|
"eval_samples_per_second": 498.003, |
|
"eval_steps_per_second": 7.989, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"grad_norm": 1.0442496538162231, |
|
"learning_rate": 8.000000000000001e-06, |
|
"loss": 0.0719, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"eval_LOCATION_f1": 0.7770700636942677, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.738255033557047, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6547619047619048, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7619047619047619, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.1436508744955063, |
|
"eval_overall_accuracy": 0.9579128722618755, |
|
"eval_overall_f1": 0.8153034300791556, |
|
"eval_overall_precision": 0.7592137592137592, |
|
"eval_overall_recall": 0.8803418803418803, |
|
"eval_runtime": 0.3727, |
|
"eval_samples_per_second": 501.681, |
|
"eval_steps_per_second": 8.048, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"grad_norm": 1.8608384132385254, |
|
"learning_rate": 7.5e-06, |
|
"loss": 0.0709, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"eval_LOCATION_f1": 0.7770700636942677, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7297297297297298, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6506024096385542, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7317073170731707, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.14415280520915985, |
|
"eval_overall_accuracy": 0.9574206251538272, |
|
"eval_overall_f1": 0.8095238095238095, |
|
"eval_overall_precision": 0.7555555555555555, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.3737, |
|
"eval_samples_per_second": 500.35, |
|
"eval_steps_per_second": 8.027, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"grad_norm": 1.1902055740356445, |
|
"learning_rate": 7.000000000000001e-06, |
|
"loss": 0.0699, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"eval_LOCATION_f1": 0.7870967741935484, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7346938775510204, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6585365853658537, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7619047619047619, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.14072592556476593, |
|
"eval_overall_accuracy": 0.958897366477972, |
|
"eval_overall_f1": 0.8169761273209548, |
|
"eval_overall_precision": 0.7642679900744417, |
|
"eval_overall_recall": 0.8774928774928775, |
|
"eval_runtime": 0.3749, |
|
"eval_samples_per_second": 498.822, |
|
"eval_steps_per_second": 8.002, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"grad_norm": 0.9288851022720337, |
|
"learning_rate": 6.5000000000000004e-06, |
|
"loss": 0.0681, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"eval_LOCATION_f1": 0.7820512820512822, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7346938775510204, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6585365853658537, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.71875, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6571428571428571, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7619047619047619, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.14135389029979706, |
|
"eval_overall_accuracy": 0.958897366477972, |
|
"eval_overall_f1": 0.8169761273209548, |
|
"eval_overall_precision": 0.7642679900744417, |
|
"eval_overall_recall": 0.8774928774928775, |
|
"eval_runtime": 0.3733, |
|
"eval_samples_per_second": 500.974, |
|
"eval_steps_per_second": 8.037, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"grad_norm": 1.107254981994629, |
|
"learning_rate": 6e-06, |
|
"loss": 0.0685, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"eval_LOCATION_f1": 0.7770700636942677, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7346938775510204, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6585365853658537, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8533333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7804878048780488, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.14269116520881653, |
|
"eval_overall_accuracy": 0.9579128722618755, |
|
"eval_overall_f1": 0.8148148148148149, |
|
"eval_overall_precision": 0.7604938271604939, |
|
"eval_overall_recall": 0.8774928774928775, |
|
"eval_runtime": 0.378, |
|
"eval_samples_per_second": 494.729, |
|
"eval_steps_per_second": 7.937, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"grad_norm": 2.199923276901245, |
|
"learning_rate": 5.500000000000001e-06, |
|
"loss": 0.0703, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"eval_LOCATION_f1": 0.7870967741935484, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7310344827586207, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6625, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8648648648648648, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.14063221216201782, |
|
"eval_overall_accuracy": 0.9593896135860202, |
|
"eval_overall_f1": 0.8186666666666667, |
|
"eval_overall_precision": 0.7694235588972431, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3757, |
|
"eval_samples_per_second": 497.751, |
|
"eval_steps_per_second": 7.985, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"grad_norm": 1.6066433191299438, |
|
"learning_rate": 5e-06, |
|
"loss": 0.0695, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"eval_LOCATION_f1": 0.7870967741935484, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.726027397260274, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.654320987654321, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8767123287671232, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.8205128205128205, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.13843446969985962, |
|
"eval_overall_accuracy": 0.9601279842480925, |
|
"eval_overall_f1": 0.8186666666666667, |
|
"eval_overall_precision": 0.7694235588972431, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3746, |
|
"eval_samples_per_second": 499.225, |
|
"eval_steps_per_second": 8.009, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"grad_norm": 1.384969711303711, |
|
"learning_rate": 4.5e-06, |
|
"loss": 0.0684, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"eval_LOCATION_f1": 0.7770700636942677, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7210884353741497, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6463414634146342, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7619047619047619, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.14361019432544708, |
|
"eval_overall_accuracy": 0.956928378045779, |
|
"eval_overall_f1": 0.8100263852242744, |
|
"eval_overall_precision": 0.7542997542997543, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3739, |
|
"eval_samples_per_second": 500.193, |
|
"eval_steps_per_second": 8.024, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"grad_norm": 1.5777561664581299, |
|
"learning_rate": 4.000000000000001e-06, |
|
"loss": 0.0681, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"eval_LOCATION_f1": 0.7870967741935484, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.726027397260274, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.654320987654321, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8533333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7804878048780488, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.14141333103179932, |
|
"eval_overall_accuracy": 0.9591434900319961, |
|
"eval_overall_f1": 0.8164893617021275, |
|
"eval_overall_precision": 0.7655860349127181, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3754, |
|
"eval_samples_per_second": 498.089, |
|
"eval_steps_per_second": 7.991, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"grad_norm": 0.12837229669094086, |
|
"learning_rate": 3.5000000000000004e-06, |
|
"loss": 0.0694, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"eval_LOCATION_f1": 0.7820512820512822, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7346938775510204, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6585365853658537, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8157894736842106, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7380952380952381, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.14285434782505035, |
|
"eval_overall_accuracy": 0.9584051193699237, |
|
"eval_overall_f1": 0.8132450331125828, |
|
"eval_overall_precision": 0.7599009900990099, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3737, |
|
"eval_samples_per_second": 500.447, |
|
"eval_steps_per_second": 8.029, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"grad_norm": 1.4026833772659302, |
|
"learning_rate": 3e-06, |
|
"loss": 0.068, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"eval_LOCATION_f1": 0.7820512820512822, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.726027397260274, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.654320987654321, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7619047619047619, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.14125195145606995, |
|
"eval_overall_accuracy": 0.9581589958158996, |
|
"eval_overall_f1": 0.8143236074270558, |
|
"eval_overall_precision": 0.7617866004962779, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3714, |
|
"eval_samples_per_second": 503.459, |
|
"eval_steps_per_second": 8.077, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"grad_norm": 2.012713670730591, |
|
"learning_rate": 2.5e-06, |
|
"loss": 0.0682, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"eval_LOCATION_f1": 0.7820512820512822, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7346938775510204, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6585365853658537, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8157894736842106, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7380952380952381, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.1429029256105423, |
|
"eval_overall_accuracy": 0.9581589958158996, |
|
"eval_overall_f1": 0.8132450331125828, |
|
"eval_overall_precision": 0.7599009900990099, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3742, |
|
"eval_samples_per_second": 499.707, |
|
"eval_steps_per_second": 8.017, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"grad_norm": 0.9533500671386719, |
|
"learning_rate": 2.0000000000000003e-06, |
|
"loss": 0.0697, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"eval_LOCATION_f1": 0.7820512820512822, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.726027397260274, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.654320987654321, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8157894736842106, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7380952380952381, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.14225105941295624, |
|
"eval_overall_accuracy": 0.9579128722618755, |
|
"eval_overall_f1": 0.8116710875331565, |
|
"eval_overall_precision": 0.7593052109181141, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.3776, |
|
"eval_samples_per_second": 495.257, |
|
"eval_steps_per_second": 7.945, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"grad_norm": 0.8223116397857666, |
|
"learning_rate": 1.5e-06, |
|
"loss": 0.0672, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"eval_LOCATION_f1": 0.7820512820512822, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.726027397260274, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.654320987654321, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8157894736842106, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7380952380952381, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.14218071103096008, |
|
"eval_overall_accuracy": 0.9579128722618755, |
|
"eval_overall_f1": 0.8116710875331565, |
|
"eval_overall_precision": 0.7593052109181141, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.3739, |
|
"eval_samples_per_second": 500.069, |
|
"eval_steps_per_second": 8.022, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"grad_norm": 3.7341294288635254, |
|
"learning_rate": 1.0000000000000002e-06, |
|
"loss": 0.0674, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"eval_LOCATION_f1": 0.7820512820512822, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7346938775510204, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6585365853658537, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8157894736842106, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7380952380952381, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.14276809990406036, |
|
"eval_overall_accuracy": 0.9584051193699237, |
|
"eval_overall_f1": 0.8132450331125828, |
|
"eval_overall_precision": 0.7599009900990099, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.3733, |
|
"eval_samples_per_second": 500.927, |
|
"eval_steps_per_second": 8.036, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"grad_norm": 0.9920492768287659, |
|
"learning_rate": 5.000000000000001e-07, |
|
"loss": 0.0666, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"eval_LOCATION_f1": 0.7820512820512822, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.726027397260274, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.654320987654321, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8157894736842106, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7380952380952381, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.14194943010807037, |
|
"eval_overall_accuracy": 0.9581589958158996, |
|
"eval_overall_f1": 0.8116710875331565, |
|
"eval_overall_precision": 0.7593052109181141, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.3735, |
|
"eval_samples_per_second": 500.685, |
|
"eval_steps_per_second": 8.032, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"grad_norm": 0.6790415644645691, |
|
"learning_rate": 0.0, |
|
"loss": 0.0693, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"eval_LOCATION_f1": 0.7820512820512822, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.726027397260274, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.654320987654321, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8157894736842106, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7380952380952381, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.1422806829214096, |
|
"eval_overall_accuracy": 0.9581589958158996, |
|
"eval_overall_f1": 0.8116710875331565, |
|
"eval_overall_precision": 0.7593052109181141, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.3745, |
|
"eval_samples_per_second": 499.395, |
|
"eval_steps_per_second": 8.012, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"step": 10600, |
|
"total_flos": 4551589111445376.0, |
|
"train_loss": 0.12385802520895904, |
|
"train_runtime": 580.0713, |
|
"train_samples_per_second": 290.999, |
|
"train_steps_per_second": 18.274 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 10600, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 100, |
|
"save_steps": 500, |
|
"total_flos": 4551589111445376.0, |
|
"train_batch_size": 16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|