{ "best_metric": null, "best_model_checkpoint": null, "epoch": 100.0, "eval_steps": 500, "global_step": 9600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "grad_norm": 1.0622260570526123, "learning_rate": 4.9500000000000004e-05, "loss": 0.8931, "step": 96 }, { "epoch": 1.0, "eval_LOCATION_f1": 0.01694915254237288, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.5, "eval_LOCATION_recall": 0.008620689655172414, "eval_ORGANIZATION_f1": 0.24025974025974026, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.24666666666666667, "eval_ORGANIZATION_recall": 0.23417721518987342, "eval_PERSON_f1": 0.2660098522167488, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.34177215189873417, "eval_PERSON_recall": 0.21774193548387097, "eval_loss": 0.402089387178421, "eval_overall_accuracy": 0.8597309909415317, "eval_overall_f1": 0.20667726550079493, "eval_overall_precision": 0.2813852813852814, "eval_overall_recall": 0.16331658291457288, "eval_runtime": 0.2477, "eval_samples_per_second": 686.279, "eval_steps_per_second": 12.111, "step": 96 }, { "epoch": 2.0, "grad_norm": 1.0000041723251343, "learning_rate": 4.9e-05, "loss": 0.3656, "step": 192 }, { "epoch": 2.0, "eval_LOCATION_f1": 0.4267782426778242, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.4146341463414634, "eval_LOCATION_recall": 0.4396551724137931, "eval_ORGANIZATION_f1": 0.5901639344262295, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.6122448979591837, "eval_ORGANIZATION_recall": 0.569620253164557, "eval_PERSON_f1": 0.5222929936305734, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.43157894736842106, "eval_PERSON_recall": 0.6612903225806451, "eval_loss": 0.21696880459785461, "eval_overall_accuracy": 0.9264342574800988, "eval_overall_f1": 0.5198135198135198, "eval_overall_precision": 0.48478260869565215, "eval_overall_recall": 0.5603015075376885, "eval_runtime": 0.2423, "eval_samples_per_second": 701.523, "eval_steps_per_second": 12.38, "step": 192 }, { "epoch": 3.0, "grad_norm": 0.8752551674842834, "learning_rate": 4.85e-05, "loss": 0.2175, "step": 288 }, { "epoch": 3.0, "eval_LOCATION_f1": 0.7214611872146118, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.7669902912621359, "eval_LOCATION_recall": 0.6810344827586207, "eval_ORGANIZATION_f1": 0.7411764705882353, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.6923076923076923, "eval_ORGANIZATION_recall": 0.7974683544303798, "eval_PERSON_f1": 0.9416342412451362, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9097744360902256, "eval_PERSON_recall": 0.9758064516129032, "eval_loss": 0.11590560525655746, "eval_overall_accuracy": 0.9648641229755696, "eval_overall_f1": 0.7990196078431372, "eval_overall_precision": 0.7799043062200957, "eval_overall_recall": 0.8190954773869347, "eval_runtime": 0.2421, "eval_samples_per_second": 702.326, "eval_steps_per_second": 12.394, "step": 288 }, { "epoch": 4.0, "grad_norm": 1.105630874633789, "learning_rate": 4.8e-05, "loss": 0.152, "step": 384 }, { "epoch": 4.0, "eval_LOCATION_f1": 0.8421052631578948, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.7938931297709924, "eval_LOCATION_recall": 0.896551724137931, "eval_ORGANIZATION_f1": 0.812121212121212, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.7790697674418605, "eval_ORGANIZATION_recall": 0.8481012658227848, "eval_PERSON_f1": 0.9647058823529411, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9389312977099237, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.08956436812877655, "eval_overall_accuracy": 0.9706286027998902, "eval_overall_f1": 0.8677884615384615, "eval_overall_precision": 0.8317972350230415, "eval_overall_recall": 0.907035175879397, "eval_runtime": 0.243, "eval_samples_per_second": 699.575, "eval_steps_per_second": 12.345, "step": 384 }, { "epoch": 5.0, "grad_norm": 0.8573193550109863, "learning_rate": 4.75e-05, "loss": 0.1153, "step": 480 }, { "epoch": 5.0, "eval_LOCATION_f1": 0.8869565217391304, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.8947368421052632, "eval_LOCATION_recall": 0.8793103448275862, "eval_ORGANIZATION_f1": 0.8492307692307692, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.8263473053892215, "eval_ORGANIZATION_recall": 0.8734177215189873, "eval_PERSON_f1": 0.9721115537848605, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9606299212598425, "eval_PERSON_recall": 0.9838709677419355, "eval_loss": 0.06209466606378555, "eval_overall_accuracy": 0.9777655778204777, "eval_overall_f1": 0.8982630272952854, "eval_overall_precision": 0.8872549019607843, "eval_overall_recall": 0.9095477386934674, "eval_runtime": 0.2426, "eval_samples_per_second": 700.706, "eval_steps_per_second": 12.365, "step": 480 }, { "epoch": 6.0, "grad_norm": 2.2799108028411865, "learning_rate": 4.7e-05, "loss": 0.1017, "step": 576 }, { "epoch": 6.0, "eval_LOCATION_f1": 0.8806584362139918, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.84251968503937, "eval_LOCATION_recall": 0.9224137931034483, "eval_ORGANIZATION_f1": 0.8827160493827162, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.8614457831325302, "eval_ORGANIZATION_recall": 0.9050632911392406, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.04618193209171295, "eval_overall_accuracy": 0.9846280538018117, "eval_overall_f1": 0.9130966952264383, "eval_overall_precision": 0.8902147971360382, "eval_overall_recall": 0.9371859296482412, "eval_runtime": 0.2426, "eval_samples_per_second": 700.771, "eval_steps_per_second": 12.367, "step": 576 }, { "epoch": 7.0, "grad_norm": 0.5819811820983887, "learning_rate": 4.6500000000000005e-05, "loss": 0.0877, "step": 672 }, { "epoch": 7.0, "eval_LOCATION_f1": 0.9170305676855894, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9292035398230089, "eval_LOCATION_recall": 0.9051724137931034, "eval_ORGANIZATION_f1": 0.9164086687306501, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.896969696969697, "eval_ORGANIZATION_recall": 0.9367088607594937, "eval_PERSON_f1": 0.9879518072289156, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.984, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.04141335189342499, "eval_overall_accuracy": 0.9857260499588252, "eval_overall_f1": 0.9388264669163546, "eval_overall_precision": 0.9330024813895782, "eval_overall_recall": 0.9447236180904522, "eval_runtime": 0.2425, "eval_samples_per_second": 701.0, "eval_steps_per_second": 12.371, "step": 672 }, { "epoch": 8.0, "grad_norm": 1.0621719360351562, "learning_rate": 4.600000000000001e-05, "loss": 0.0772, "step": 768 }, { "epoch": 8.0, "eval_LOCATION_f1": 0.9152542372881356, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9, "eval_LOCATION_recall": 0.9310344827586207, "eval_ORGANIZATION_f1": 0.91875, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9074074074074074, "eval_ORGANIZATION_recall": 0.930379746835443, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.03698663040995598, "eval_overall_accuracy": 0.9873730441943454, "eval_overall_f1": 0.9379652605459057, "eval_overall_precision": 0.9264705882352942, "eval_overall_recall": 0.949748743718593, "eval_runtime": 0.2428, "eval_samples_per_second": 700.264, "eval_steps_per_second": 12.358, "step": 768 }, { "epoch": 9.0, "grad_norm": 0.5991101861000061, "learning_rate": 4.55e-05, "loss": 0.0747, "step": 864 }, { "epoch": 9.0, "eval_LOCATION_f1": 0.9288702928870294, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9024390243902439, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9345794392523364, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9202453987730062, "eval_ORGANIZATION_recall": 0.9493670886075949, "eval_PERSON_f1": 0.9879518072289156, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.984, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.04177405312657356, "eval_overall_accuracy": 0.9860005489980785, "eval_overall_f1": 0.9493201483312732, "eval_overall_precision": 0.9343065693430657, "eval_overall_recall": 0.964824120603015, "eval_runtime": 0.2423, "eval_samples_per_second": 701.484, "eval_steps_per_second": 12.379, "step": 864 }, { "epoch": 10.0, "grad_norm": 0.7477170825004578, "learning_rate": 4.5e-05, "loss": 0.0712, "step": 960 }, { "epoch": 10.0, "eval_LOCATION_f1": 0.9268292682926829, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.8769230769230769, "eval_LOCATION_recall": 0.9827586206896551, "eval_ORGANIZATION_f1": 0.9329073482428115, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9419354838709677, "eval_ORGANIZATION_recall": 0.9240506329113924, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.04179945960640907, "eval_overall_accuracy": 0.9851770518803185, "eval_overall_f1": 0.9468479604449939, "eval_overall_precision": 0.9318734793187348, "eval_overall_recall": 0.9623115577889447, "eval_runtime": 0.2429, "eval_samples_per_second": 699.957, "eval_steps_per_second": 12.352, "step": 960 }, { "epoch": 11.0, "grad_norm": 0.4425092041492462, "learning_rate": 4.4500000000000004e-05, "loss": 0.0645, "step": 1056 }, { "epoch": 11.0, "eval_LOCATION_f1": 0.9191489361702128, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.907563025210084, "eval_LOCATION_recall": 0.9310344827586207, "eval_ORGANIZATION_f1": 0.9341692789968652, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9254658385093167, "eval_ORGANIZATION_recall": 0.9430379746835443, "eval_PERSON_f1": 0.9879518072289156, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.984, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.034665558487176895, "eval_overall_accuracy": 0.9884710403513588, "eval_overall_f1": 0.946450809464508, "eval_overall_precision": 0.9382716049382716, "eval_overall_recall": 0.9547738693467337, "eval_runtime": 0.2429, "eval_samples_per_second": 699.774, "eval_steps_per_second": 12.349, "step": 1056 }, { "epoch": 12.0, "grad_norm": 0.994752824306488, "learning_rate": 4.4000000000000006e-05, "loss": 0.0594, "step": 1152 }, { "epoch": 12.0, "eval_LOCATION_f1": 0.923076923076923, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9152542372881356, "eval_LOCATION_recall": 0.9310344827586207, "eval_ORGANIZATION_f1": 0.9164086687306501, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.896969696969697, "eval_ORGANIZATION_recall": 0.9367088607594937, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.03453850373625755, "eval_overall_accuracy": 0.9876475432335987, "eval_overall_f1": 0.9392812887236679, "eval_overall_precision": 0.9266503667481663, "eval_overall_recall": 0.9522613065326633, "eval_runtime": 0.2433, "eval_samples_per_second": 698.803, "eval_steps_per_second": 12.332, "step": 1152 }, { "epoch": 13.0, "grad_norm": 0.3863960802555084, "learning_rate": 4.35e-05, "loss": 0.0584, "step": 1248 }, { "epoch": 13.0, "eval_LOCATION_f1": 0.927038626609442, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9230769230769231, "eval_LOCATION_recall": 0.9310344827586207, "eval_ORGANIZATION_f1": 0.9496855345911951, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.94375, "eval_ORGANIZATION_recall": 0.9556962025316456, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.030687231570482254, "eval_overall_accuracy": 0.9906670326653857, "eval_overall_f1": 0.9538077403245941, "eval_overall_precision": 0.9478908188585607, "eval_overall_recall": 0.9597989949748744, "eval_runtime": 0.2423, "eval_samples_per_second": 701.612, "eval_steps_per_second": 12.381, "step": 1248 }, { "epoch": 14.0, "grad_norm": 0.7108584642410278, "learning_rate": 4.3e-05, "loss": 0.0533, "step": 1344 }, { "epoch": 14.0, "eval_LOCATION_f1": 0.9276595744680851, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9159663865546218, "eval_LOCATION_recall": 0.9396551724137931, "eval_ORGANIZATION_f1": 0.9245283018867925, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.91875, "eval_ORGANIZATION_recall": 0.930379746835443, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.03466002270579338, "eval_overall_accuracy": 0.9879220422728521, "eval_overall_f1": 0.9439601494396015, "eval_overall_precision": 0.9358024691358025, "eval_overall_recall": 0.9522613065326633, "eval_runtime": 0.245, "eval_samples_per_second": 694.012, "eval_steps_per_second": 12.247, "step": 1344 }, { "epoch": 15.0, "grad_norm": 0.4726468324661255, "learning_rate": 4.25e-05, "loss": 0.051, "step": 1440 }, { "epoch": 15.0, "eval_LOCATION_f1": 0.9367088607594937, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9173553719008265, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9337539432176657, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9308176100628931, "eval_ORGANIZATION_recall": 0.9367088607594937, "eval_PERSON_f1": 0.9879518072289156, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.984, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.03434712067246437, "eval_overall_accuracy": 0.9890200384298655, "eval_overall_f1": 0.9514321295143213, "eval_overall_precision": 0.9432098765432099, "eval_overall_recall": 0.9597989949748744, "eval_runtime": 0.2429, "eval_samples_per_second": 699.91, "eval_steps_per_second": 12.351, "step": 1440 }, { "epoch": 16.0, "grad_norm": 0.5781874060630798, "learning_rate": 4.2e-05, "loss": 0.0498, "step": 1536 }, { "epoch": 16.0, "eval_LOCATION_f1": 0.9243697478991596, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9016393442622951, "eval_LOCATION_recall": 0.9482758620689655, "eval_ORGANIZATION_f1": 0.9196141479099678, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.934640522875817, "eval_ORGANIZATION_recall": 0.9050632911392406, "eval_PERSON_f1": 0.9800796812749005, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.968503937007874, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.03455718606710434, "eval_overall_accuracy": 0.9884710403513588, "eval_overall_f1": 0.94, "eval_overall_precision": 0.9353233830845771, "eval_overall_recall": 0.9447236180904522, "eval_runtime": 0.2432, "eval_samples_per_second": 698.89, "eval_steps_per_second": 12.333, "step": 1536 }, { "epoch": 17.0, "grad_norm": 0.1878691464662552, "learning_rate": 4.15e-05, "loss": 0.0452, "step": 1632 }, { "epoch": 17.0, "eval_LOCATION_f1": 0.925, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.8951612903225806, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9171974522292994, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9230769230769231, "eval_ORGANIZATION_recall": 0.9113924050632911, "eval_PERSON_f1": 0.9879518072289156, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.984, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.035126231610774994, "eval_overall_accuracy": 0.987098545155092, "eval_overall_f1": 0.9414694894146949, "eval_overall_precision": 0.9333333333333333, "eval_overall_recall": 0.949748743718593, "eval_runtime": 0.2425, "eval_samples_per_second": 700.995, "eval_steps_per_second": 12.37, "step": 1632 }, { "epoch": 18.0, "grad_norm": 0.7006422877311707, "learning_rate": 4.1e-05, "loss": 0.0437, "step": 1728 }, { "epoch": 18.0, "eval_LOCATION_f1": 0.9282700421940928, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9090909090909091, "eval_LOCATION_recall": 0.9482758620689655, "eval_ORGANIZATION_f1": 0.9433962264150944, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9375, "eval_ORGANIZATION_recall": 0.9493670886075949, "eval_PERSON_f1": 0.9879518072289156, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.984, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.035111382603645325, "eval_overall_accuracy": 0.9887455393906122, "eval_overall_f1": 0.9527363184079602, "eval_overall_precision": 0.9433497536945813, "eval_overall_recall": 0.9623115577889447, "eval_runtime": 0.2425, "eval_samples_per_second": 700.948, "eval_steps_per_second": 12.37, "step": 1728 }, { "epoch": 19.0, "grad_norm": 0.6293537616729736, "learning_rate": 4.05e-05, "loss": 0.0419, "step": 1824 }, { "epoch": 19.0, "eval_LOCATION_f1": 0.9115044247787611, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9363636363636364, "eval_LOCATION_recall": 0.8879310344827587, "eval_ORGANIZATION_f1": 0.9375000000000001, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9259259259259259, "eval_ORGANIZATION_recall": 0.9493670886075949, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.03315844014286995, "eval_overall_accuracy": 0.9890200384298655, "eval_overall_f1": 0.9447236180904522, "eval_overall_precision": 0.9447236180904522, "eval_overall_recall": 0.9447236180904522, "eval_runtime": 0.2423, "eval_samples_per_second": 701.628, "eval_steps_per_second": 12.382, "step": 1824 }, { "epoch": 20.0, "grad_norm": 0.43634268641471863, "learning_rate": 4e-05, "loss": 0.0409, "step": 1920 }, { "epoch": 20.0, "eval_LOCATION_f1": 0.9310344827586207, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9310344827586207, "eval_LOCATION_recall": 0.9310344827586207, "eval_ORGANIZATION_f1": 0.9254658385093167, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9085365853658537, "eval_ORGANIZATION_recall": 0.9430379746835443, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.035573337227106094, "eval_overall_accuracy": 0.9890200384298655, "eval_overall_f1": 0.945273631840796, "eval_overall_precision": 0.9359605911330049, "eval_overall_recall": 0.9547738693467337, "eval_runtime": 0.2427, "eval_samples_per_second": 700.581, "eval_steps_per_second": 12.363, "step": 1920 }, { "epoch": 21.0, "grad_norm": 1.104005217552185, "learning_rate": 3.9500000000000005e-05, "loss": 0.0403, "step": 2016 }, { "epoch": 21.0, "eval_LOCATION_f1": 0.925, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.8951612903225806, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9294871794871796, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9415584415584416, "eval_ORGANIZATION_recall": 0.9177215189873418, "eval_PERSON_f1": 0.9879518072289156, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.984, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.02913746051490307, "eval_overall_accuracy": 0.9890200384298655, "eval_overall_f1": 0.9463171036204745, "eval_overall_precision": 0.9404466501240695, "eval_overall_recall": 0.9522613065326633, "eval_runtime": 0.2423, "eval_samples_per_second": 701.518, "eval_steps_per_second": 12.38, "step": 2016 }, { "epoch": 22.0, "grad_norm": 0.9109427332878113, "learning_rate": 3.9000000000000006e-05, "loss": 0.0368, "step": 2112 }, { "epoch": 22.0, "eval_LOCATION_f1": 0.9304347826086956, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9385964912280702, "eval_LOCATION_recall": 0.9224137931034483, "eval_ORGANIZATION_f1": 0.9337539432176657, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9308176100628931, "eval_ORGANIZATION_recall": 0.9367088607594937, "eval_PERSON_f1": 0.9800796812749005, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.968503937007874, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.03580503910779953, "eval_overall_accuracy": 0.9895690365083722, "eval_overall_f1": 0.9473684210526316, "eval_overall_precision": 0.945, "eval_overall_recall": 0.949748743718593, "eval_runtime": 0.2428, "eval_samples_per_second": 700.269, "eval_steps_per_second": 12.358, "step": 2112 }, { "epoch": 23.0, "grad_norm": 0.4533730745315552, "learning_rate": 3.85e-05, "loss": 0.0402, "step": 2208 }, { "epoch": 23.0, "eval_LOCATION_f1": 0.9531914893617022, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9411764705882353, "eval_LOCATION_recall": 0.9655172413793104, "eval_ORGANIZATION_f1": 0.9337539432176657, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9308176100628931, "eval_ORGANIZATION_recall": 0.9367088607594937, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.02975594624876976, "eval_overall_accuracy": 0.9903925336261323, "eval_overall_f1": 0.9551122194513715, "eval_overall_precision": 0.948019801980198, "eval_overall_recall": 0.9623115577889447, "eval_runtime": 0.2418, "eval_samples_per_second": 703.141, "eval_steps_per_second": 12.408, "step": 2208 }, { "epoch": 24.0, "grad_norm": 0.4602113962173462, "learning_rate": 3.8e-05, "loss": 0.0353, "step": 2304 }, { "epoch": 24.0, "eval_LOCATION_f1": 0.9406779661016949, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.925, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9363057324840764, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9423076923076923, "eval_ORGANIZATION_recall": 0.930379746835443, "eval_PERSON_f1": 0.9879518072289156, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.984, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.03227541968226433, "eval_overall_accuracy": 0.9895690365083722, "eval_overall_f1": 0.9536921151439299, "eval_overall_precision": 0.9501246882793017, "eval_overall_recall": 0.957286432160804, "eval_runtime": 0.2439, "eval_samples_per_second": 696.954, "eval_steps_per_second": 12.299, "step": 2304 }, { "epoch": 25.0, "grad_norm": 0.7048800587654114, "learning_rate": 3.7500000000000003e-05, "loss": 0.0332, "step": 2400 }, { "epoch": 25.0, "eval_LOCATION_f1": 0.9456066945606694, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9186991869918699, "eval_LOCATION_recall": 0.9741379310344828, "eval_ORGANIZATION_f1": 0.9003215434083601, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9150326797385621, "eval_ORGANIZATION_recall": 0.8860759493670886, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.03731263801455498, "eval_overall_accuracy": 0.9887455393906122, "eval_overall_f1": 0.94, "eval_overall_precision": 0.9353233830845771, "eval_overall_recall": 0.9447236180904522, "eval_runtime": 0.2428, "eval_samples_per_second": 700.288, "eval_steps_per_second": 12.358, "step": 2400 }, { "epoch": 26.0, "grad_norm": 0.6570234894752502, "learning_rate": 3.7e-05, "loss": 0.0343, "step": 2496 }, { "epoch": 26.0, "eval_LOCATION_f1": 0.9406779661016949, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.925, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9211356466876972, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9182389937106918, "eval_ORGANIZATION_recall": 0.9240506329113924, "eval_PERSON_f1": 0.9879518072289156, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.984, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.040523938834667206, "eval_overall_accuracy": 0.9884710403513588, "eval_overall_f1": 0.9476309226932669, "eval_overall_precision": 0.9405940594059405, "eval_overall_recall": 0.9547738693467337, "eval_runtime": 0.2423, "eval_samples_per_second": 701.468, "eval_steps_per_second": 12.379, "step": 2496 }, { "epoch": 27.0, "grad_norm": 0.9857751131057739, "learning_rate": 3.65e-05, "loss": 0.0342, "step": 2592 }, { "epoch": 27.0, "eval_LOCATION_f1": 0.9406779661016949, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.925, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9363057324840764, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9423076923076923, "eval_ORGANIZATION_recall": 0.930379746835443, "eval_PERSON_f1": 0.9800796812749005, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.968503937007874, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.03457554057240486, "eval_overall_accuracy": 0.9887455393906122, "eval_overall_f1": 0.951310861423221, "eval_overall_precision": 0.9454094292803971, "eval_overall_recall": 0.957286432160804, "eval_runtime": 0.2421, "eval_samples_per_second": 702.06, "eval_steps_per_second": 12.389, "step": 2592 }, { "epoch": 28.0, "grad_norm": 0.46330365538597107, "learning_rate": 3.6e-05, "loss": 0.032, "step": 2688 }, { "epoch": 28.0, "eval_LOCATION_f1": 0.923076923076923, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9152542372881356, "eval_LOCATION_recall": 0.9310344827586207, "eval_ORGANIZATION_f1": 0.9299363057324842, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9358974358974359, "eval_ORGANIZATION_recall": 0.9240506329113924, "eval_PERSON_f1": 0.9800796812749005, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.968503937007874, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.04411082714796066, "eval_overall_accuracy": 0.987098545155092, "eval_overall_f1": 0.9436795994993743, "eval_overall_precision": 0.940149625935162, "eval_overall_recall": 0.9472361809045227, "eval_runtime": 0.2418, "eval_samples_per_second": 703.003, "eval_steps_per_second": 12.406, "step": 2688 }, { "epoch": 29.0, "grad_norm": 0.4757544696331024, "learning_rate": 3.55e-05, "loss": 0.0275, "step": 2784 }, { "epoch": 29.0, "eval_LOCATION_f1": 0.9396551724137931, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9396551724137931, "eval_LOCATION_recall": 0.9396551724137931, "eval_ORGANIZATION_f1": 0.9221183800623053, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9079754601226994, "eval_ORGANIZATION_recall": 0.9367088607594937, "eval_PERSON_f1": 0.9879518072289156, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.984, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.04470400512218475, "eval_overall_accuracy": 0.9876475432335987, "eval_overall_f1": 0.9476309226932669, "eval_overall_precision": 0.9405940594059405, "eval_overall_recall": 0.9547738693467337, "eval_runtime": 0.242, "eval_samples_per_second": 702.55, "eval_steps_per_second": 12.398, "step": 2784 }, { "epoch": 30.0, "grad_norm": 1.0357615947723389, "learning_rate": 3.5e-05, "loss": 0.0273, "step": 2880 }, { "epoch": 30.0, "eval_LOCATION_f1": 0.9304347826086956, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9385964912280702, "eval_LOCATION_recall": 0.9224137931034483, "eval_ORGANIZATION_f1": 0.9316770186335404, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9146341463414634, "eval_ORGANIZATION_recall": 0.9493670886075949, "eval_PERSON_f1": 0.9879518072289156, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.984, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.043819691985845566, "eval_overall_accuracy": 0.9884710403513588, "eval_overall_f1": 0.9488139825218478, "eval_overall_precision": 0.9429280397022333, "eval_overall_recall": 0.9547738693467337, "eval_runtime": 0.2421, "eval_samples_per_second": 702.271, "eval_steps_per_second": 12.393, "step": 2880 }, { "epoch": 31.0, "grad_norm": 0.5754586458206177, "learning_rate": 3.45e-05, "loss": 0.0287, "step": 2976 }, { "epoch": 31.0, "eval_LOCATION_f1": 0.9411764705882353, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9180327868852459, "eval_LOCATION_recall": 0.9655172413793104, "eval_ORGANIZATION_f1": 0.9290322580645162, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9473684210526315, "eval_ORGANIZATION_recall": 0.9113924050632911, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.035712841898202896, "eval_overall_accuracy": 0.990118034586879, "eval_overall_f1": 0.9498746867167919, "eval_overall_precision": 0.9475, "eval_overall_recall": 0.9522613065326633, "eval_runtime": 0.242, "eval_samples_per_second": 702.469, "eval_steps_per_second": 12.397, "step": 2976 }, { "epoch": 32.0, "grad_norm": 0.4603827893733978, "learning_rate": 3.4000000000000007e-05, "loss": 0.0274, "step": 3072 }, { "epoch": 32.0, "eval_LOCATION_f1": 0.9288702928870294, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9024390243902439, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9131832797427653, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9281045751633987, "eval_ORGANIZATION_recall": 0.8987341772151899, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.04034664109349251, "eval_overall_accuracy": 0.9881965413121054, "eval_overall_f1": 0.94, "eval_overall_precision": 0.9353233830845771, "eval_overall_recall": 0.9447236180904522, "eval_runtime": 0.2418, "eval_samples_per_second": 703.177, "eval_steps_per_second": 12.409, "step": 3072 }, { "epoch": 33.0, "grad_norm": 0.4669646620750427, "learning_rate": 3.35e-05, "loss": 0.0284, "step": 3168 }, { "epoch": 33.0, "eval_LOCATION_f1": 0.9327731092436975, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9098360655737705, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9196141479099678, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.934640522875817, "eval_ORGANIZATION_recall": 0.9050632911392406, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.04073726758360863, "eval_overall_accuracy": 0.9879220422728521, "eval_overall_f1": 0.9436795994993743, "eval_overall_precision": 0.940149625935162, "eval_overall_recall": 0.9472361809045227, "eval_runtime": 0.2426, "eval_samples_per_second": 700.664, "eval_steps_per_second": 12.365, "step": 3168 }, { "epoch": 34.0, "grad_norm": 0.14242352545261383, "learning_rate": 3.3e-05, "loss": 0.0269, "step": 3264 }, { "epoch": 34.0, "eval_LOCATION_f1": 0.9406779661016949, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.925, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9312499999999999, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9197530864197531, "eval_ORGANIZATION_recall": 0.9430379746835443, "eval_PERSON_f1": 0.9879518072289156, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.984, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.04001469165086746, "eval_overall_accuracy": 0.9895690365083722, "eval_overall_f1": 0.9515527950310558, "eval_overall_precision": 0.941031941031941, "eval_overall_recall": 0.9623115577889447, "eval_runtime": 0.2432, "eval_samples_per_second": 698.955, "eval_steps_per_second": 12.334, "step": 3264 }, { "epoch": 35.0, "grad_norm": 0.5518023371696472, "learning_rate": 3.2500000000000004e-05, "loss": 0.0245, "step": 3360 }, { "epoch": 35.0, "eval_LOCATION_f1": 0.935064935064935, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9391304347826087, "eval_LOCATION_recall": 0.9310344827586207, "eval_ORGANIZATION_f1": 0.9226006191950465, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9030303030303031, "eval_ORGANIZATION_recall": 0.9430379746835443, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.03874511644244194, "eval_overall_accuracy": 0.9884710403513588, "eval_overall_f1": 0.945273631840796, "eval_overall_precision": 0.9359605911330049, "eval_overall_recall": 0.9547738693467337, "eval_runtime": 0.2431, "eval_samples_per_second": 699.42, "eval_steps_per_second": 12.343, "step": 3360 }, { "epoch": 36.0, "grad_norm": 1.2177473306655884, "learning_rate": 3.2000000000000005e-05, "loss": 0.0251, "step": 3456 }, { "epoch": 36.0, "eval_LOCATION_f1": 0.9406779661016949, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.925, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9308176100628932, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.925, "eval_ORGANIZATION_recall": 0.9367088607594937, "eval_PERSON_f1": 0.9879518072289156, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.984, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.03678901121020317, "eval_overall_accuracy": 0.9895690365083722, "eval_overall_f1": 0.9514321295143213, "eval_overall_precision": 0.9432098765432099, "eval_overall_recall": 0.9597989949748744, "eval_runtime": 0.2423, "eval_samples_per_second": 701.694, "eval_steps_per_second": 12.383, "step": 3456 }, { "epoch": 37.0, "grad_norm": 1.4173684120178223, "learning_rate": 3.15e-05, "loss": 0.0243, "step": 3552 }, { "epoch": 37.0, "eval_LOCATION_f1": 0.9356223175965666, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9316239316239316, "eval_LOCATION_recall": 0.9396551724137931, "eval_ORGANIZATION_f1": 0.9333333333333332, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9363057324840764, "eval_ORGANIZATION_recall": 0.930379746835443, "eval_PERSON_f1": 0.9800796812749005, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.968503937007874, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.03889763355255127, "eval_overall_accuracy": 0.9895690365083722, "eval_overall_f1": 0.9486858573216519, "eval_overall_precision": 0.9451371571072319, "eval_overall_recall": 0.9522613065326633, "eval_runtime": 0.2444, "eval_samples_per_second": 695.549, "eval_steps_per_second": 12.274, "step": 3552 }, { "epoch": 38.0, "grad_norm": 0.6296694874763489, "learning_rate": 3.1e-05, "loss": 0.0242, "step": 3648 }, { "epoch": 38.0, "eval_LOCATION_f1": 0.9113924050632911, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.8925619834710744, "eval_LOCATION_recall": 0.9310344827586207, "eval_ORGANIZATION_f1": 0.9235668789808917, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9294871794871795, "eval_ORGANIZATION_recall": 0.9177215189873418, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.04012976959347725, "eval_overall_accuracy": 0.9879220422728521, "eval_overall_f1": 0.9388264669163546, "eval_overall_precision": 0.9330024813895782, "eval_overall_recall": 0.9447236180904522, "eval_runtime": 0.2429, "eval_samples_per_second": 699.989, "eval_steps_per_second": 12.353, "step": 3648 }, { "epoch": 39.0, "grad_norm": 0.07241743803024292, "learning_rate": 3.05e-05, "loss": 0.0244, "step": 3744 }, { "epoch": 39.0, "eval_LOCATION_f1": 0.9406779661016949, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.925, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9329073482428115, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9419354838709677, "eval_ORGANIZATION_recall": 0.9240506329113924, "eval_PERSON_f1": 0.9800796812749005, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.968503937007874, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.04065397381782532, "eval_overall_accuracy": 0.9876475432335987, "eval_overall_f1": 0.95, "eval_overall_precision": 0.945273631840796, "eval_overall_recall": 0.9547738693467337, "eval_runtime": 0.2421, "eval_samples_per_second": 702.128, "eval_steps_per_second": 12.39, "step": 3744 }, { "epoch": 40.0, "grad_norm": 0.13085119426250458, "learning_rate": 3e-05, "loss": 0.0211, "step": 3840 }, { "epoch": 40.0, "eval_LOCATION_f1": 0.9361702127659575, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9243697478991597, "eval_LOCATION_recall": 0.9482758620689655, "eval_ORGANIZATION_f1": 0.9375000000000001, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9259259259259259, "eval_ORGANIZATION_recall": 0.9493670886075949, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.04333576187491417, "eval_overall_accuracy": 0.9890200384298655, "eval_overall_f1": 0.9515527950310558, "eval_overall_precision": 0.941031941031941, "eval_overall_recall": 0.9623115577889447, "eval_runtime": 0.2428, "eval_samples_per_second": 700.162, "eval_steps_per_second": 12.356, "step": 3840 }, { "epoch": 41.0, "grad_norm": 0.029861435294151306, "learning_rate": 2.95e-05, "loss": 0.0223, "step": 3936 }, { "epoch": 41.0, "eval_LOCATION_f1": 0.944206008583691, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9401709401709402, "eval_LOCATION_recall": 0.9482758620689655, "eval_ORGANIZATION_f1": 0.9278996865203761, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9192546583850931, "eval_ORGANIZATION_recall": 0.9367088607594937, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.03654933720827103, "eval_overall_accuracy": 0.9892945374691189, "eval_overall_f1": 0.9501246882793017, "eval_overall_precision": 0.943069306930693, "eval_overall_recall": 0.957286432160804, "eval_runtime": 0.2424, "eval_samples_per_second": 701.253, "eval_steps_per_second": 12.375, "step": 3936 }, { "epoch": 42.0, "grad_norm": 0.09470277279615402, "learning_rate": 2.9e-05, "loss": 0.0224, "step": 4032 }, { "epoch": 42.0, "eval_LOCATION_f1": 0.94017094017094, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9322033898305084, "eval_LOCATION_recall": 0.9482758620689655, "eval_ORGANIZATION_f1": 0.9278996865203761, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9192546583850931, "eval_ORGANIZATION_recall": 0.9367088607594937, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.039208512753248215, "eval_overall_accuracy": 0.9895690365083722, "eval_overall_f1": 0.9489414694894147, "eval_overall_precision": 0.9407407407407408, "eval_overall_recall": 0.957286432160804, "eval_runtime": 0.2423, "eval_samples_per_second": 701.592, "eval_steps_per_second": 12.381, "step": 4032 }, { "epoch": 43.0, "grad_norm": 0.29208576679229736, "learning_rate": 2.8499999999999998e-05, "loss": 0.0197, "step": 4128 }, { "epoch": 43.0, "eval_LOCATION_f1": 0.9316239316239315, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.923728813559322, "eval_LOCATION_recall": 0.9396551724137931, "eval_ORGANIZATION_f1": 0.9274447949526813, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9245283018867925, "eval_ORGANIZATION_recall": 0.930379746835443, "eval_PERSON_f1": 0.9761904761904763, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9609375, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.03720787167549133, "eval_overall_accuracy": 0.9890200384298655, "eval_overall_f1": 0.9439601494396015, "eval_overall_precision": 0.9358024691358025, "eval_overall_recall": 0.9522613065326633, "eval_runtime": 0.242, "eval_samples_per_second": 702.453, "eval_steps_per_second": 12.396, "step": 4128 }, { "epoch": 44.0, "grad_norm": 0.3295332193374634, "learning_rate": 2.8000000000000003e-05, "loss": 0.022, "step": 4224 }, { "epoch": 44.0, "eval_LOCATION_f1": 0.9446808510638298, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9327731092436975, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9177215189873418, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9177215189873418, "eval_ORGANIZATION_recall": 0.9177215189873418, "eval_PERSON_f1": 0.9800796812749005, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.968503937007874, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.04005124792456627, "eval_overall_accuracy": 0.9884710403513588, "eval_overall_f1": 0.9451371571072318, "eval_overall_precision": 0.9381188118811881, "eval_overall_recall": 0.9522613065326633, "eval_runtime": 0.2427, "eval_samples_per_second": 700.36, "eval_steps_per_second": 12.359, "step": 4224 }, { "epoch": 45.0, "grad_norm": 1.0696682929992676, "learning_rate": 2.7500000000000004e-05, "loss": 0.0192, "step": 4320 }, { "epoch": 45.0, "eval_LOCATION_f1": 0.9406779661016949, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.925, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.926517571884984, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9354838709677419, "eval_ORGANIZATION_recall": 0.9177215189873418, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.04148309305310249, "eval_overall_accuracy": 0.9887455393906122, "eval_overall_f1": 0.9486858573216519, "eval_overall_precision": 0.9451371571072319, "eval_overall_recall": 0.9522613065326633, "eval_runtime": 0.2424, "eval_samples_per_second": 701.317, "eval_steps_per_second": 12.376, "step": 4320 }, { "epoch": 46.0, "grad_norm": 0.5310882925987244, "learning_rate": 2.7000000000000002e-05, "loss": 0.0197, "step": 4416 }, { "epoch": 46.0, "eval_LOCATION_f1": 0.9456066945606694, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9186991869918699, "eval_LOCATION_recall": 0.9741379310344828, "eval_ORGANIZATION_f1": 0.9274447949526813, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9245283018867925, "eval_ORGANIZATION_recall": 0.930379746835443, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.03862782195210457, "eval_overall_accuracy": 0.990118034586879, "eval_overall_f1": 0.9503722084367245, "eval_overall_precision": 0.9387254901960784, "eval_overall_recall": 0.9623115577889447, "eval_runtime": 0.2435, "eval_samples_per_second": 698.028, "eval_steps_per_second": 12.318, "step": 4416 }, { "epoch": 47.0, "grad_norm": 0.36547964811325073, "learning_rate": 2.6500000000000004e-05, "loss": 0.02, "step": 4512 }, { "epoch": 47.0, "eval_LOCATION_f1": 0.944206008583691, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9401709401709402, "eval_LOCATION_recall": 0.9482758620689655, "eval_ORGANIZATION_f1": 0.940809968847352, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9263803680981595, "eval_ORGANIZATION_recall": 0.9556962025316456, "eval_PERSON_f1": 0.9800796812749005, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.968503937007874, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.042170971632003784, "eval_overall_accuracy": 0.9892945374691189, "eval_overall_f1": 0.9540372670807453, "eval_overall_precision": 0.9434889434889435, "eval_overall_recall": 0.964824120603015, "eval_runtime": 0.2438, "eval_samples_per_second": 697.197, "eval_steps_per_second": 12.303, "step": 4512 }, { "epoch": 48.0, "grad_norm": 0.4364250600337982, "learning_rate": 2.6000000000000002e-05, "loss": 0.0192, "step": 4608 }, { "epoch": 48.0, "eval_LOCATION_f1": 0.9411764705882353, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9180327868852459, "eval_LOCATION_recall": 0.9655172413793104, "eval_ORGANIZATION_f1": 0.923076923076923, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.935064935064935, "eval_ORGANIZATION_recall": 0.9113924050632911, "eval_PERSON_f1": 0.9879518072289156, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.984, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.03884365037083626, "eval_overall_accuracy": 0.9879220422728521, "eval_overall_f1": 0.9486858573216519, "eval_overall_precision": 0.9451371571072319, "eval_overall_recall": 0.9522613065326633, "eval_runtime": 0.2413, "eval_samples_per_second": 704.424, "eval_steps_per_second": 12.431, "step": 4608 }, { "epoch": 49.0, "grad_norm": 0.6926938891410828, "learning_rate": 2.5500000000000003e-05, "loss": 0.0182, "step": 4704 }, { "epoch": 49.0, "eval_LOCATION_f1": 0.9535864978902953, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9338842975206612, "eval_LOCATION_recall": 0.9741379310344828, "eval_ORGANIZATION_f1": 0.9430379746835443, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9430379746835443, "eval_ORGANIZATION_recall": 0.9430379746835443, "eval_PERSON_f1": 0.9879518072289156, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.984, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.04192095994949341, "eval_overall_accuracy": 0.9895690365083722, "eval_overall_f1": 0.9600997506234414, "eval_overall_precision": 0.9529702970297029, "eval_overall_recall": 0.9673366834170855, "eval_runtime": 0.2413, "eval_samples_per_second": 704.587, "eval_steps_per_second": 12.434, "step": 4704 }, { "epoch": 50.0, "grad_norm": 0.5129674673080444, "learning_rate": 2.5e-05, "loss": 0.0182, "step": 4800 }, { "epoch": 50.0, "eval_LOCATION_f1": 0.9491525423728815, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9333333333333333, "eval_LOCATION_recall": 0.9655172413793104, "eval_ORGANIZATION_f1": 0.9142857142857144, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9171974522292994, "eval_ORGANIZATION_recall": 0.9113924050632911, "eval_PERSON_f1": 0.9800796812749005, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.968503937007874, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.04355218634009361, "eval_overall_accuracy": 0.9881965413121054, "eval_overall_f1": 0.9451371571072318, "eval_overall_precision": 0.9381188118811881, "eval_overall_recall": 0.9522613065326633, "eval_runtime": 0.2421, "eval_samples_per_second": 702.06, "eval_steps_per_second": 12.389, "step": 4800 }, { "epoch": 51.0, "grad_norm": 0.3724958598613739, "learning_rate": 2.45e-05, "loss": 0.0196, "step": 4896 }, { "epoch": 51.0, "eval_LOCATION_f1": 0.9367088607594937, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9173553719008265, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9294871794871796, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9415584415584416, "eval_ORGANIZATION_recall": 0.9177215189873418, "eval_PERSON_f1": 0.9761904761904763, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9609375, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.04640508443117142, "eval_overall_accuracy": 0.9876475432335987, "eval_overall_f1": 0.9463171036204745, "eval_overall_precision": 0.9404466501240695, "eval_overall_recall": 0.9522613065326633, "eval_runtime": 0.2424, "eval_samples_per_second": 701.373, "eval_steps_per_second": 12.377, "step": 4896 }, { "epoch": 52.0, "grad_norm": 0.4651976525783539, "learning_rate": 2.4e-05, "loss": 0.016, "step": 4992 }, { "epoch": 52.0, "eval_LOCATION_f1": 0.9288702928870294, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9024390243902439, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.923076923076923, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.935064935064935, "eval_ORGANIZATION_recall": 0.9113924050632911, "eval_PERSON_f1": 0.9761904761904763, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9609375, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.04982294142246246, "eval_overall_accuracy": 0.987098545155092, "eval_overall_f1": 0.9414694894146949, "eval_overall_precision": 0.9333333333333333, "eval_overall_recall": 0.949748743718593, "eval_runtime": 0.2422, "eval_samples_per_second": 702.013, "eval_steps_per_second": 12.388, "step": 4992 }, { "epoch": 53.0, "grad_norm": 0.3692150413990021, "learning_rate": 2.35e-05, "loss": 0.0174, "step": 5088 }, { "epoch": 53.0, "eval_LOCATION_f1": 0.944206008583691, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9401709401709402, "eval_LOCATION_recall": 0.9482758620689655, "eval_ORGANIZATION_f1": 0.9426751592356688, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9487179487179487, "eval_ORGANIZATION_recall": 0.9367088607594937, "eval_PERSON_f1": 0.9761904761904763, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9609375, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.047746025025844574, "eval_overall_accuracy": 0.9887455393906122, "eval_overall_f1": 0.9536921151439299, "eval_overall_precision": 0.9501246882793017, "eval_overall_recall": 0.957286432160804, "eval_runtime": 0.2418, "eval_samples_per_second": 703.203, "eval_steps_per_second": 12.409, "step": 5088 }, { "epoch": 54.0, "grad_norm": 2.322037935256958, "learning_rate": 2.3000000000000003e-05, "loss": 0.0156, "step": 5184 }, { "epoch": 54.0, "eval_LOCATION_f1": 0.944206008583691, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9401709401709402, "eval_LOCATION_recall": 0.9482758620689655, "eval_ORGANIZATION_f1": 0.9363057324840764, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9423076923076923, "eval_ORGANIZATION_recall": 0.930379746835443, "eval_PERSON_f1": 0.9800796812749005, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.968503937007874, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.05073067173361778, "eval_overall_accuracy": 0.9881965413121054, "eval_overall_f1": 0.9523809523809523, "eval_overall_precision": 0.95, "eval_overall_recall": 0.9547738693467337, "eval_runtime": 0.2418, "eval_samples_per_second": 703.172, "eval_steps_per_second": 12.409, "step": 5184 }, { "epoch": 55.0, "grad_norm": 0.8182074427604675, "learning_rate": 2.25e-05, "loss": 0.0161, "step": 5280 }, { "epoch": 55.0, "eval_LOCATION_f1": 0.944206008583691, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9401709401709402, "eval_LOCATION_recall": 0.9482758620689655, "eval_ORGANIZATION_f1": 0.9235668789808917, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9294871794871795, "eval_ORGANIZATION_recall": 0.9177215189873418, "eval_PERSON_f1": 0.9800796812749005, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.968503937007874, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.04936642944812775, "eval_overall_accuracy": 0.9887455393906122, "eval_overall_f1": 0.9473684210526316, "eval_overall_precision": 0.945, "eval_overall_recall": 0.949748743718593, "eval_runtime": 0.2422, "eval_samples_per_second": 701.981, "eval_steps_per_second": 12.388, "step": 5280 }, { "epoch": 56.0, "grad_norm": 0.47536519169807434, "learning_rate": 2.2000000000000003e-05, "loss": 0.0154, "step": 5376 }, { "epoch": 56.0, "eval_LOCATION_f1": 0.9322033898305084, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9166666666666666, "eval_LOCATION_recall": 0.9482758620689655, "eval_ORGANIZATION_f1": 0.9177215189873418, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9177215189873418, "eval_ORGANIZATION_recall": 0.9177215189873418, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.04633556678891182, "eval_overall_accuracy": 0.9884710403513588, "eval_overall_f1": 0.9426433915211971, "eval_overall_precision": 0.9356435643564357, "eval_overall_recall": 0.949748743718593, "eval_runtime": 0.2421, "eval_samples_per_second": 702.149, "eval_steps_per_second": 12.391, "step": 5376 }, { "epoch": 57.0, "grad_norm": 0.4734033942222595, "learning_rate": 2.15e-05, "loss": 0.0159, "step": 5472 }, { "epoch": 57.0, "eval_LOCATION_f1": 0.9482758620689655, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9482758620689655, "eval_LOCATION_recall": 0.9482758620689655, "eval_ORGANIZATION_f1": 0.9245283018867925, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.91875, "eval_ORGANIZATION_recall": 0.930379746835443, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.04754474759101868, "eval_overall_accuracy": 0.9881965413121054, "eval_overall_f1": 0.95, "eval_overall_precision": 0.945273631840796, "eval_overall_recall": 0.9547738693467337, "eval_runtime": 0.2424, "eval_samples_per_second": 701.32, "eval_steps_per_second": 12.376, "step": 5472 }, { "epoch": 58.0, "grad_norm": 0.09098278731107712, "learning_rate": 2.1e-05, "loss": 0.0159, "step": 5568 }, { "epoch": 58.0, "eval_LOCATION_f1": 0.9327731092436975, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9098360655737705, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9260450160771704, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9411764705882353, "eval_ORGANIZATION_recall": 0.9113924050632911, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.049943216145038605, "eval_overall_accuracy": 0.9873730441943454, "eval_overall_f1": 0.9461827284105131, "eval_overall_precision": 0.942643391521197, "eval_overall_recall": 0.949748743718593, "eval_runtime": 0.2423, "eval_samples_per_second": 701.712, "eval_steps_per_second": 12.383, "step": 5568 }, { "epoch": 59.0, "grad_norm": 0.28300827741622925, "learning_rate": 2.05e-05, "loss": 0.0154, "step": 5664 }, { "epoch": 59.0, "eval_LOCATION_f1": 0.9406779661016949, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.925, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.926984126984127, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9299363057324841, "eval_ORGANIZATION_recall": 0.9240506329113924, "eval_PERSON_f1": 0.9800796812749005, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.968503937007874, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.04638950154185295, "eval_overall_accuracy": 0.9881965413121054, "eval_overall_f1": 0.9476309226932669, "eval_overall_precision": 0.9405940594059405, "eval_overall_recall": 0.9547738693467337, "eval_runtime": 0.2422, "eval_samples_per_second": 701.998, "eval_steps_per_second": 12.388, "step": 5664 }, { "epoch": 60.0, "grad_norm": 0.24135783314704895, "learning_rate": 2e-05, "loss": 0.0146, "step": 5760 }, { "epoch": 60.0, "eval_LOCATION_f1": 0.9372384937238494, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9105691056910569, "eval_LOCATION_recall": 0.9655172413793104, "eval_ORGANIZATION_f1": 0.9396825396825397, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9426751592356688, "eval_ORGANIZATION_recall": 0.9367088607594937, "eval_PERSON_f1": 0.9800796812749005, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.968503937007874, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.05022583156824112, "eval_overall_accuracy": 0.9881965413121054, "eval_overall_f1": 0.9515527950310558, "eval_overall_precision": 0.941031941031941, "eval_overall_recall": 0.9623115577889447, "eval_runtime": 0.2423, "eval_samples_per_second": 701.667, "eval_steps_per_second": 12.382, "step": 5760 }, { "epoch": 61.0, "grad_norm": 0.48841485381126404, "learning_rate": 1.9500000000000003e-05, "loss": 0.0164, "step": 5856 }, { "epoch": 61.0, "eval_LOCATION_f1": 0.9411764705882353, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9180327868852459, "eval_LOCATION_recall": 0.9655172413793104, "eval_ORGANIZATION_f1": 0.926984126984127, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9299363057324841, "eval_ORGANIZATION_recall": 0.9240506329113924, "eval_PERSON_f1": 0.9879518072289156, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.984, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.047981929033994675, "eval_overall_accuracy": 0.9879220422728521, "eval_overall_f1": 0.9501246882793017, "eval_overall_precision": 0.943069306930693, "eval_overall_recall": 0.957286432160804, "eval_runtime": 0.2422, "eval_samples_per_second": 701.864, "eval_steps_per_second": 12.386, "step": 5856 }, { "epoch": 62.0, "grad_norm": 0.623166024684906, "learning_rate": 1.9e-05, "loss": 0.0126, "step": 5952 }, { "epoch": 62.0, "eval_LOCATION_f1": 0.925, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.8951612903225806, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9102564102564102, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.922077922077922, "eval_ORGANIZATION_recall": 0.8987341772151899, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.05383405089378357, "eval_overall_accuracy": 0.987098545155092, "eval_overall_f1": 0.9376558603491272, "eval_overall_precision": 0.9306930693069307, "eval_overall_recall": 0.9447236180904522, "eval_runtime": 0.242, "eval_samples_per_second": 702.589, "eval_steps_per_second": 12.399, "step": 5952 }, { "epoch": 63.0, "grad_norm": 0.06195319816470146, "learning_rate": 1.85e-05, "loss": 0.0142, "step": 6048 }, { "epoch": 63.0, "eval_LOCATION_f1": 0.9572649572649573, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9491525423728814, "eval_LOCATION_recall": 0.9655172413793104, "eval_ORGANIZATION_f1": 0.9206349206349206, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9235668789808917, "eval_ORGANIZATION_recall": 0.9177215189873418, "eval_PERSON_f1": 0.9879518072289156, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.984, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.050431687384843826, "eval_overall_accuracy": 0.9887455393906122, "eval_overall_f1": 0.9523809523809523, "eval_overall_precision": 0.95, "eval_overall_recall": 0.9547738693467337, "eval_runtime": 0.2441, "eval_samples_per_second": 696.509, "eval_steps_per_second": 12.291, "step": 6048 }, { "epoch": 64.0, "grad_norm": 0.38351964950561523, "learning_rate": 1.8e-05, "loss": 0.0131, "step": 6144 }, { "epoch": 64.0, "eval_LOCATION_f1": 0.9568965517241379, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9568965517241379, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9463722397476341, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9433962264150944, "eval_ORGANIZATION_recall": 0.9493670886075949, "eval_PERSON_f1": 0.9800796812749005, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.968503937007874, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.04740133136510849, "eval_overall_accuracy": 0.9890200384298655, "eval_overall_f1": 0.96, "eval_overall_precision": 0.9552238805970149, "eval_overall_recall": 0.964824120603015, "eval_runtime": 0.242, "eval_samples_per_second": 702.471, "eval_steps_per_second": 12.397, "step": 6144 }, { "epoch": 65.0, "grad_norm": 0.42032256722450256, "learning_rate": 1.75e-05, "loss": 0.0144, "step": 6240 }, { "epoch": 65.0, "eval_LOCATION_f1": 0.9451476793248945, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9256198347107438, "eval_LOCATION_recall": 0.9655172413793104, "eval_ORGANIZATION_f1": 0.926517571884984, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9354838709677419, "eval_ORGANIZATION_recall": 0.9177215189873418, "eval_PERSON_f1": 0.9799196787148594, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.976, "eval_PERSON_recall": 0.9838709677419355, "eval_loss": 0.05012889206409454, "eval_overall_accuracy": 0.9876475432335987, "eval_overall_f1": 0.9486858573216519, "eval_overall_precision": 0.9451371571072319, "eval_overall_recall": 0.9522613065326633, "eval_runtime": 0.2428, "eval_samples_per_second": 700.183, "eval_steps_per_second": 12.356, "step": 6240 }, { "epoch": 66.0, "grad_norm": 0.6347458362579346, "learning_rate": 1.7000000000000003e-05, "loss": 0.0135, "step": 6336 }, { "epoch": 66.0, "eval_LOCATION_f1": 0.9446808510638298, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9327731092436975, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9240506329113924, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9240506329113924, "eval_ORGANIZATION_recall": 0.9240506329113924, "eval_PERSON_f1": 0.9800796812749005, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.968503937007874, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.05208972468972206, "eval_overall_accuracy": 0.9876475432335987, "eval_overall_f1": 0.9476309226932669, "eval_overall_precision": 0.9405940594059405, "eval_overall_recall": 0.9547738693467337, "eval_runtime": 0.2429, "eval_samples_per_second": 699.867, "eval_steps_per_second": 12.351, "step": 6336 }, { "epoch": 67.0, "grad_norm": 1.0222524404525757, "learning_rate": 1.65e-05, "loss": 0.0162, "step": 6432 }, { "epoch": 67.0, "eval_LOCATION_f1": 0.9406779661016949, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.925, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9201277955271565, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9290322580645162, "eval_ORGANIZATION_recall": 0.9113924050632911, "eval_PERSON_f1": 0.9800796812749005, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.968503937007874, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.05340787023305893, "eval_overall_accuracy": 0.9862750480373319, "eval_overall_f1": 0.9450000000000001, "eval_overall_precision": 0.9402985074626866, "eval_overall_recall": 0.949748743718593, "eval_runtime": 0.2417, "eval_samples_per_second": 703.351, "eval_steps_per_second": 12.412, "step": 6432 }, { "epoch": 68.0, "grad_norm": 0.6841771006584167, "learning_rate": 1.6000000000000003e-05, "loss": 0.0136, "step": 6528 }, { "epoch": 68.0, "eval_LOCATION_f1": 0.9406779661016949, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.925, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9363057324840764, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9423076923076923, "eval_ORGANIZATION_recall": 0.930379746835443, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.05373825877904892, "eval_overall_accuracy": 0.9881965413121054, "eval_overall_f1": 0.9525, "eval_overall_precision": 0.9477611940298507, "eval_overall_recall": 0.957286432160804, "eval_runtime": 0.2419, "eval_samples_per_second": 702.784, "eval_steps_per_second": 12.402, "step": 6528 }, { "epoch": 69.0, "grad_norm": 1.1261268854141235, "learning_rate": 1.55e-05, "loss": 0.0138, "step": 6624 }, { "epoch": 69.0, "eval_LOCATION_f1": 0.9361702127659575, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9243697478991597, "eval_LOCATION_recall": 0.9482758620689655, "eval_ORGANIZATION_f1": 0.9363057324840764, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9423076923076923, "eval_ORGANIZATION_recall": 0.930379746835443, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.05131537467241287, "eval_overall_accuracy": 0.9887455393906122, "eval_overall_f1": 0.951188986232791, "eval_overall_precision": 0.9476309226932669, "eval_overall_recall": 0.9547738693467337, "eval_runtime": 0.2421, "eval_samples_per_second": 702.112, "eval_steps_per_second": 12.39, "step": 6624 }, { "epoch": 70.0, "grad_norm": 0.47885391116142273, "learning_rate": 1.5e-05, "loss": 0.0135, "step": 6720 }, { "epoch": 70.0, "eval_LOCATION_f1": 0.9406779661016949, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.925, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.926984126984127, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9299363057324841, "eval_ORGANIZATION_recall": 0.9240506329113924, "eval_PERSON_f1": 0.9800796812749005, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.968503937007874, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.05541845038533211, "eval_overall_accuracy": 0.987098545155092, "eval_overall_f1": 0.9476309226932669, "eval_overall_precision": 0.9405940594059405, "eval_overall_recall": 0.9547738693467337, "eval_runtime": 0.2426, "eval_samples_per_second": 700.621, "eval_steps_per_second": 12.364, "step": 6720 }, { "epoch": 71.0, "grad_norm": 0.29839274287223816, "learning_rate": 1.45e-05, "loss": 0.0121, "step": 6816 }, { "epoch": 71.0, "eval_LOCATION_f1": 0.9482758620689655, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9482758620689655, "eval_LOCATION_recall": 0.9482758620689655, "eval_ORGANIZATION_f1": 0.9341692789968652, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9254658385093167, "eval_ORGANIZATION_recall": 0.9430379746835443, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.05237449333071709, "eval_overall_accuracy": 0.9884710403513588, "eval_overall_f1": 0.9538077403245941, "eval_overall_precision": 0.9478908188585607, "eval_overall_recall": 0.9597989949748744, "eval_runtime": 0.2432, "eval_samples_per_second": 698.886, "eval_steps_per_second": 12.333, "step": 6816 }, { "epoch": 72.0, "grad_norm": 1.4181568622589111, "learning_rate": 1.4000000000000001e-05, "loss": 0.0131, "step": 6912 }, { "epoch": 72.0, "eval_LOCATION_f1": 0.9406779661016949, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.925, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9235668789808917, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9294871794871795, "eval_ORGANIZATION_recall": 0.9177215189873418, "eval_PERSON_f1": 0.9800796812749005, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.968503937007874, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.05246526002883911, "eval_overall_accuracy": 0.9881965413121054, "eval_overall_f1": 0.9463171036204745, "eval_overall_precision": 0.9404466501240695, "eval_overall_recall": 0.9522613065326633, "eval_runtime": 0.2421, "eval_samples_per_second": 702.097, "eval_steps_per_second": 12.39, "step": 6912 }, { "epoch": 73.0, "grad_norm": 0.5246819853782654, "learning_rate": 1.3500000000000001e-05, "loss": 0.0129, "step": 7008 }, { "epoch": 73.0, "eval_LOCATION_f1": 0.9322033898305084, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9166666666666666, "eval_LOCATION_recall": 0.9482758620689655, "eval_ORGANIZATION_f1": 0.926517571884984, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9354838709677419, "eval_ORGANIZATION_recall": 0.9177215189873418, "eval_PERSON_f1": 0.9721115537848605, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9606299212598425, "eval_PERSON_recall": 0.9838709677419355, "eval_loss": 0.05284268409013748, "eval_overall_accuracy": 0.9876475432335987, "eval_overall_f1": 0.9425, "eval_overall_precision": 0.9378109452736318, "eval_overall_recall": 0.9472361809045227, "eval_runtime": 0.2425, "eval_samples_per_second": 701.026, "eval_steps_per_second": 12.371, "step": 7008 }, { "epoch": 74.0, "grad_norm": 0.1629040539264679, "learning_rate": 1.3000000000000001e-05, "loss": 0.0118, "step": 7104 }, { "epoch": 74.0, "eval_LOCATION_f1": 0.9361702127659575, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9243697478991597, "eval_LOCATION_recall": 0.9482758620689655, "eval_ORGANIZATION_f1": 0.9329073482428115, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9419354838709677, "eval_ORGANIZATION_recall": 0.9240506329113924, "eval_PERSON_f1": 0.9721115537848605, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9606299212598425, "eval_PERSON_recall": 0.9838709677419355, "eval_loss": 0.05083697289228439, "eval_overall_accuracy": 0.9884710403513588, "eval_overall_f1": 0.9461827284105131, "eval_overall_precision": 0.942643391521197, "eval_overall_recall": 0.949748743718593, "eval_runtime": 0.2416, "eval_samples_per_second": 703.535, "eval_steps_per_second": 12.415, "step": 7104 }, { "epoch": 75.0, "grad_norm": 0.34347105026245117, "learning_rate": 1.25e-05, "loss": 0.0109, "step": 7200 }, { "epoch": 75.0, "eval_LOCATION_f1": 0.9367088607594937, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9173553719008265, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.926517571884984, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9354838709677419, "eval_ORGANIZATION_recall": 0.9177215189873418, "eval_PERSON_f1": 0.9682539682539683, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.953125, "eval_PERSON_recall": 0.9838709677419355, "eval_loss": 0.053751371800899506, "eval_overall_accuracy": 0.9881965413121054, "eval_overall_f1": 0.9426433915211971, "eval_overall_precision": 0.9356435643564357, "eval_overall_recall": 0.949748743718593, "eval_runtime": 0.2421, "eval_samples_per_second": 702.067, "eval_steps_per_second": 12.389, "step": 7200 }, { "epoch": 76.0, "grad_norm": 0.0426780991256237, "learning_rate": 1.2e-05, "loss": 0.0115, "step": 7296 }, { "epoch": 76.0, "eval_LOCATION_f1": 0.9367088607594937, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9173553719008265, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9294871794871796, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9415584415584416, "eval_ORGANIZATION_recall": 0.9177215189873418, "eval_PERSON_f1": 0.9682539682539683, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.953125, "eval_PERSON_recall": 0.9838709677419355, "eval_loss": 0.05429477617144585, "eval_overall_accuracy": 0.9881965413121054, "eval_overall_f1": 0.9438202247191011, "eval_overall_precision": 0.9379652605459057, "eval_overall_recall": 0.949748743718593, "eval_runtime": 0.2446, "eval_samples_per_second": 695.028, "eval_steps_per_second": 12.265, "step": 7296 }, { "epoch": 77.0, "grad_norm": 0.332469642162323, "learning_rate": 1.1500000000000002e-05, "loss": 0.0121, "step": 7392 }, { "epoch": 77.0, "eval_LOCATION_f1": 0.9367088607594937, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9173553719008265, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9201277955271565, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9290322580645162, "eval_ORGANIZATION_recall": 0.9113924050632911, "eval_PERSON_f1": 0.9721115537848605, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9606299212598425, "eval_PERSON_recall": 0.9838709677419355, "eval_loss": 0.05492376908659935, "eval_overall_accuracy": 0.9873730441943454, "eval_overall_f1": 0.9413233458177278, "eval_overall_precision": 0.9354838709677419, "eval_overall_recall": 0.9472361809045227, "eval_runtime": 0.242, "eval_samples_per_second": 702.433, "eval_steps_per_second": 12.396, "step": 7392 }, { "epoch": 78.0, "grad_norm": 0.5249147415161133, "learning_rate": 1.1000000000000001e-05, "loss": 0.0116, "step": 7488 }, { "epoch": 78.0, "eval_LOCATION_f1": 0.9367088607594937, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9173553719008265, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9044585987261147, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9102564102564102, "eval_ORGANIZATION_recall": 0.8987341772151899, "eval_PERSON_f1": 0.9721115537848605, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9606299212598425, "eval_PERSON_recall": 0.9838709677419355, "eval_loss": 0.05314483493566513, "eval_overall_accuracy": 0.9862750480373319, "eval_overall_f1": 0.9351620947630923, "eval_overall_precision": 0.9282178217821783, "eval_overall_recall": 0.9422110552763819, "eval_runtime": 0.2432, "eval_samples_per_second": 698.87, "eval_steps_per_second": 12.333, "step": 7488 }, { "epoch": 79.0, "grad_norm": 0.028825916349887848, "learning_rate": 1.05e-05, "loss": 0.0131, "step": 7584 }, { "epoch": 79.0, "eval_LOCATION_f1": 0.944206008583691, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9401709401709402, "eval_LOCATION_recall": 0.9482758620689655, "eval_ORGANIZATION_f1": 0.9526813880126183, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.949685534591195, "eval_ORGANIZATION_recall": 0.9556962025316456, "eval_PERSON_f1": 0.9800796812749005, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.968503937007874, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.04911971837282181, "eval_overall_accuracy": 0.9890200384298655, "eval_overall_f1": 0.958801498127341, "eval_overall_precision": 0.9528535980148883, "eval_overall_recall": 0.964824120603015, "eval_runtime": 0.2435, "eval_samples_per_second": 698.29, "eval_steps_per_second": 12.323, "step": 7584 }, { "epoch": 80.0, "grad_norm": 0.19487972557544708, "learning_rate": 1e-05, "loss": 0.0113, "step": 7680 }, { "epoch": 80.0, "eval_LOCATION_f1": 0.9482758620689655, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9482758620689655, "eval_LOCATION_recall": 0.9482758620689655, "eval_ORGANIZATION_f1": 0.9085173501577287, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9056603773584906, "eval_ORGANIZATION_recall": 0.9113924050632911, "eval_PERSON_f1": 0.9761904761904763, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9609375, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.05024532973766327, "eval_overall_accuracy": 0.9873730441943454, "eval_overall_f1": 0.9413233458177278, "eval_overall_precision": 0.9354838709677419, "eval_overall_recall": 0.9472361809045227, "eval_runtime": 0.2425, "eval_samples_per_second": 701.107, "eval_steps_per_second": 12.372, "step": 7680 }, { "epoch": 81.0, "grad_norm": 0.2933664619922638, "learning_rate": 9.5e-06, "loss": 0.0114, "step": 7776 }, { "epoch": 81.0, "eval_LOCATION_f1": 0.9487179487179486, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.940677966101695, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9142857142857144, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9171974522292994, "eval_ORGANIZATION_recall": 0.9113924050632911, "eval_PERSON_f1": 0.9800796812749005, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.968503937007874, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.050492897629737854, "eval_overall_accuracy": 0.9881965413121054, "eval_overall_f1": 0.9450000000000001, "eval_overall_precision": 0.9402985074626866, "eval_overall_recall": 0.949748743718593, "eval_runtime": 0.245, "eval_samples_per_second": 693.863, "eval_steps_per_second": 12.245, "step": 7776 }, { "epoch": 82.0, "grad_norm": 0.8371833562850952, "learning_rate": 9e-06, "loss": 0.0101, "step": 7872 }, { "epoch": 82.0, "eval_LOCATION_f1": 0.9446808510638298, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9327731092436975, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9137380191693291, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9225806451612903, "eval_ORGANIZATION_recall": 0.9050632911392406, "eval_PERSON_f1": 0.9761904761904763, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9609375, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.05484500154852867, "eval_overall_accuracy": 0.987098545155092, "eval_overall_f1": 0.9425, "eval_overall_precision": 0.9378109452736318, "eval_overall_recall": 0.9472361809045227, "eval_runtime": 0.2414, "eval_samples_per_second": 704.348, "eval_steps_per_second": 12.43, "step": 7872 }, { "epoch": 83.0, "grad_norm": 0.3084019720554352, "learning_rate": 8.500000000000002e-06, "loss": 0.0098, "step": 7968 }, { "epoch": 83.0, "eval_LOCATION_f1": 0.9406779661016949, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.925, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.910828025477707, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9166666666666666, "eval_ORGANIZATION_recall": 0.9050632911392406, "eval_PERSON_f1": 0.9721115537848605, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9606299212598425, "eval_PERSON_recall": 0.9838709677419355, "eval_loss": 0.0543341189622879, "eval_overall_accuracy": 0.987098545155092, "eval_overall_f1": 0.9388264669163546, "eval_overall_precision": 0.9330024813895782, "eval_overall_recall": 0.9447236180904522, "eval_runtime": 0.2426, "eval_samples_per_second": 700.604, "eval_steps_per_second": 12.364, "step": 7968 }, { "epoch": 84.0, "grad_norm": 0.04305460304021835, "learning_rate": 8.000000000000001e-06, "loss": 0.01, "step": 8064 }, { "epoch": 84.0, "eval_LOCATION_f1": 0.9527896995708154, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9487179487179487, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9299363057324842, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9358974358974359, "eval_ORGANIZATION_recall": 0.9240506329113924, "eval_PERSON_f1": 0.9800796812749005, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.968503937007874, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.054905395954847336, "eval_overall_accuracy": 0.9873730441943454, "eval_overall_f1": 0.9523809523809523, "eval_overall_precision": 0.95, "eval_overall_recall": 0.9547738693467337, "eval_runtime": 0.2424, "eval_samples_per_second": 701.305, "eval_steps_per_second": 12.376, "step": 8064 }, { "epoch": 85.0, "grad_norm": 0.7204985022544861, "learning_rate": 7.5e-06, "loss": 0.0106, "step": 8160 }, { "epoch": 85.0, "eval_LOCATION_f1": 0.9491525423728815, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9333333333333333, "eval_LOCATION_recall": 0.9655172413793104, "eval_ORGANIZATION_f1": 0.926984126984127, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9299363057324841, "eval_ORGANIZATION_recall": 0.9240506329113924, "eval_PERSON_f1": 0.9800796812749005, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.968503937007874, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.05248566344380379, "eval_overall_accuracy": 0.9890200384298655, "eval_overall_f1": 0.9501246882793017, "eval_overall_precision": 0.943069306930693, "eval_overall_recall": 0.957286432160804, "eval_runtime": 0.2418, "eval_samples_per_second": 703.138, "eval_steps_per_second": 12.408, "step": 8160 }, { "epoch": 86.0, "grad_norm": 0.07470478117465973, "learning_rate": 7.000000000000001e-06, "loss": 0.0102, "step": 8256 }, { "epoch": 86.0, "eval_LOCATION_f1": 0.9487179487179486, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.940677966101695, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.926984126984127, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9299363057324841, "eval_ORGANIZATION_recall": 0.9240506329113924, "eval_PERSON_f1": 0.976, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9682539682539683, "eval_PERSON_recall": 0.9838709677419355, "eval_loss": 0.05321876332163811, "eval_overall_accuracy": 0.9879220422728521, "eval_overall_f1": 0.9486858573216519, "eval_overall_precision": 0.9451371571072319, "eval_overall_recall": 0.9522613065326633, "eval_runtime": 0.2428, "eval_samples_per_second": 700.282, "eval_steps_per_second": 12.358, "step": 8256 }, { "epoch": 87.0, "grad_norm": 0.2286868691444397, "learning_rate": 6.5000000000000004e-06, "loss": 0.0092, "step": 8352 }, { "epoch": 87.0, "eval_LOCATION_f1": 0.9367088607594937, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9173553719008265, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9206349206349206, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9235668789808917, "eval_ORGANIZATION_recall": 0.9177215189873418, "eval_PERSON_f1": 0.976, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9682539682539683, "eval_PERSON_recall": 0.9838709677419355, "eval_loss": 0.053863525390625, "eval_overall_accuracy": 0.9879220422728521, "eval_overall_f1": 0.9426433915211971, "eval_overall_precision": 0.9356435643564357, "eval_overall_recall": 0.949748743718593, "eval_runtime": 0.2431, "eval_samples_per_second": 699.324, "eval_steps_per_second": 12.341, "step": 8352 }, { "epoch": 88.0, "grad_norm": 0.19395892322063446, "learning_rate": 6e-06, "loss": 0.0095, "step": 8448 }, { "epoch": 88.0, "eval_LOCATION_f1": 0.9367088607594937, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9173553719008265, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9299363057324842, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9358974358974359, "eval_ORGANIZATION_recall": 0.9240506329113924, "eval_PERSON_f1": 0.976, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9682539682539683, "eval_PERSON_recall": 0.9838709677419355, "eval_loss": 0.05385447293519974, "eval_overall_accuracy": 0.9873730441943454, "eval_overall_f1": 0.9463171036204745, "eval_overall_precision": 0.9404466501240695, "eval_overall_recall": 0.9522613065326633, "eval_runtime": 0.2425, "eval_samples_per_second": 700.995, "eval_steps_per_second": 12.37, "step": 8448 }, { "epoch": 89.0, "grad_norm": 0.5978826880455017, "learning_rate": 5.500000000000001e-06, "loss": 0.0099, "step": 8544 }, { "epoch": 89.0, "eval_LOCATION_f1": 0.9406779661016949, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.925, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9367088607594937, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9367088607594937, "eval_ORGANIZATION_recall": 0.9367088607594937, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.052636079490184784, "eval_overall_accuracy": 0.9890200384298655, "eval_overall_f1": 0.9526184538653367, "eval_overall_precision": 0.9455445544554455, "eval_overall_recall": 0.9597989949748744, "eval_runtime": 0.2422, "eval_samples_per_second": 702.032, "eval_steps_per_second": 12.389, "step": 8544 }, { "epoch": 90.0, "grad_norm": 0.17808915674686432, "learning_rate": 5e-06, "loss": 0.0095, "step": 8640 }, { "epoch": 90.0, "eval_LOCATION_f1": 0.9487179487179486, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.940677966101695, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9363057324840764, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9423076923076923, "eval_ORGANIZATION_recall": 0.930379746835443, "eval_PERSON_f1": 0.9800796812749005, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.968503937007874, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.05316346138715744, "eval_overall_accuracy": 0.9884710403513588, "eval_overall_f1": 0.9536921151439299, "eval_overall_precision": 0.9501246882793017, "eval_overall_recall": 0.957286432160804, "eval_runtime": 0.2434, "eval_samples_per_second": 698.582, "eval_steps_per_second": 12.328, "step": 8640 }, { "epoch": 91.0, "grad_norm": 0.17433640360832214, "learning_rate": 4.5e-06, "loss": 0.0099, "step": 8736 }, { "epoch": 91.0, "eval_LOCATION_f1": 0.9406779661016949, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.925, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9299363057324842, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9358974358974359, "eval_ORGANIZATION_recall": 0.9240506329113924, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.052069030702114105, "eval_overall_accuracy": 0.9887455393906122, "eval_overall_f1": 0.95, "eval_overall_precision": 0.945273631840796, "eval_overall_recall": 0.9547738693467337, "eval_runtime": 0.2421, "eval_samples_per_second": 702.241, "eval_steps_per_second": 12.392, "step": 8736 }, { "epoch": 92.0, "grad_norm": 0.0391317717730999, "learning_rate": 4.000000000000001e-06, "loss": 0.0095, "step": 8832 }, { "epoch": 92.0, "eval_LOCATION_f1": 0.9406779661016949, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.925, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9240506329113924, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9240506329113924, "eval_ORGANIZATION_recall": 0.9240506329113924, "eval_PERSON_f1": 0.976, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9682539682539683, "eval_PERSON_recall": 0.9838709677419355, "eval_loss": 0.05470087379217148, "eval_overall_accuracy": 0.9879220422728521, "eval_overall_f1": 0.9451371571072318, "eval_overall_precision": 0.9381188118811881, "eval_overall_recall": 0.9522613065326633, "eval_runtime": 0.2418, "eval_samples_per_second": 702.995, "eval_steps_per_second": 12.406, "step": 8832 }, { "epoch": 93.0, "grad_norm": 1.2939667701721191, "learning_rate": 3.5000000000000004e-06, "loss": 0.0096, "step": 8928 }, { "epoch": 93.0, "eval_LOCATION_f1": 0.9487179487179486, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.940677966101695, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9299363057324842, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9358974358974359, "eval_ORGANIZATION_recall": 0.9240506329113924, "eval_PERSON_f1": 0.9721115537848605, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9606299212598425, "eval_PERSON_recall": 0.9838709677419355, "eval_loss": 0.05360059067606926, "eval_overall_accuracy": 0.9884710403513588, "eval_overall_f1": 0.9486858573216519, "eval_overall_precision": 0.9451371571072319, "eval_overall_recall": 0.9522613065326633, "eval_runtime": 0.2419, "eval_samples_per_second": 702.744, "eval_steps_per_second": 12.401, "step": 8928 }, { "epoch": 94.0, "grad_norm": 1.3997987508773804, "learning_rate": 3e-06, "loss": 0.009, "step": 9024 }, { "epoch": 94.0, "eval_LOCATION_f1": 0.9446808510638298, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.9327731092436975, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9235668789808917, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9294871794871795, "eval_ORGANIZATION_recall": 0.9177215189873418, "eval_PERSON_f1": 0.9800796812749005, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.968503937007874, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.053766991943120956, "eval_overall_accuracy": 0.9884710403513588, "eval_overall_f1": 0.9475, "eval_overall_precision": 0.9427860696517413, "eval_overall_recall": 0.9522613065326633, "eval_runtime": 0.2419, "eval_samples_per_second": 702.867, "eval_steps_per_second": 12.404, "step": 9024 }, { "epoch": 95.0, "grad_norm": 0.015623769722878933, "learning_rate": 2.5e-06, "loss": 0.0094, "step": 9120 }, { "epoch": 95.0, "eval_LOCATION_f1": 0.9406779661016949, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.925, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.926517571884984, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9354838709677419, "eval_ORGANIZATION_recall": 0.9177215189873418, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.05312187969684601, "eval_overall_accuracy": 0.9887455393906122, "eval_overall_f1": 0.9486858573216519, "eval_overall_precision": 0.9451371571072319, "eval_overall_recall": 0.9522613065326633, "eval_runtime": 0.2423, "eval_samples_per_second": 701.669, "eval_steps_per_second": 12.382, "step": 9120 }, { "epoch": 96.0, "grad_norm": 0.06812173873186111, "learning_rate": 2.0000000000000003e-06, "loss": 0.0083, "step": 9216 }, { "epoch": 96.0, "eval_LOCATION_f1": 0.9406779661016949, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.925, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.9235668789808917, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9294871794871795, "eval_ORGANIZATION_recall": 0.9177215189873418, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.052705731242895126, "eval_overall_accuracy": 0.9887455393906122, "eval_overall_f1": 0.9475, "eval_overall_precision": 0.9427860696517413, "eval_overall_recall": 0.9522613065326633, "eval_runtime": 0.2425, "eval_samples_per_second": 701.06, "eval_steps_per_second": 12.372, "step": 9216 }, { "epoch": 97.0, "grad_norm": 0.13947905600070953, "learning_rate": 1.5e-06, "loss": 0.0099, "step": 9312 }, { "epoch": 97.0, "eval_LOCATION_f1": 0.9406779661016949, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.925, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.926517571884984, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9354838709677419, "eval_ORGANIZATION_recall": 0.9177215189873418, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.05367732793092728, "eval_overall_accuracy": 0.9890200384298655, "eval_overall_f1": 0.9486858573216519, "eval_overall_precision": 0.9451371571072319, "eval_overall_recall": 0.9522613065326633, "eval_runtime": 0.2429, "eval_samples_per_second": 699.966, "eval_steps_per_second": 12.352, "step": 9312 }, { "epoch": 98.0, "grad_norm": 0.10114230960607529, "learning_rate": 1.0000000000000002e-06, "loss": 0.0078, "step": 9408 }, { "epoch": 98.0, "eval_LOCATION_f1": 0.9406779661016949, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.925, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.926517571884984, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9354838709677419, "eval_ORGANIZATION_recall": 0.9177215189873418, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.05298721790313721, "eval_overall_accuracy": 0.9892945374691189, "eval_overall_f1": 0.9486858573216519, "eval_overall_precision": 0.9451371571072319, "eval_overall_recall": 0.9522613065326633, "eval_runtime": 0.2421, "eval_samples_per_second": 702.26, "eval_steps_per_second": 12.393, "step": 9408 }, { "epoch": 99.0, "grad_norm": 0.5689762234687805, "learning_rate": 5.000000000000001e-07, "loss": 0.0093, "step": 9504 }, { "epoch": 99.0, "eval_LOCATION_f1": 0.9406779661016949, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.925, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.926517571884984, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9354838709677419, "eval_ORGANIZATION_recall": 0.9177215189873418, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.052819643169641495, "eval_overall_accuracy": 0.9892945374691189, "eval_overall_f1": 0.9486858573216519, "eval_overall_precision": 0.9451371571072319, "eval_overall_recall": 0.9522613065326633, "eval_runtime": 0.2426, "eval_samples_per_second": 700.726, "eval_steps_per_second": 12.366, "step": 9504 }, { "epoch": 100.0, "grad_norm": 0.09888800233602524, "learning_rate": 0.0, "loss": 0.0086, "step": 9600 }, { "epoch": 100.0, "eval_LOCATION_f1": 0.9406779661016949, "eval_LOCATION_number": 116, "eval_LOCATION_precision": 0.925, "eval_LOCATION_recall": 0.9568965517241379, "eval_ORGANIZATION_f1": 0.926517571884984, "eval_ORGANIZATION_number": 158, "eval_ORGANIZATION_precision": 0.9354838709677419, "eval_ORGANIZATION_recall": 0.9177215189873418, "eval_PERSON_f1": 0.9840000000000001, "eval_PERSON_number": 124, "eval_PERSON_precision": 0.9761904761904762, "eval_PERSON_recall": 0.9919354838709677, "eval_loss": 0.052767641842365265, "eval_overall_accuracy": 0.9895690365083722, "eval_overall_f1": 0.9486858573216519, "eval_overall_precision": 0.9451371571072319, "eval_overall_recall": 0.9522613065326633, "eval_runtime": 0.2425, "eval_samples_per_second": 701.096, "eval_steps_per_second": 12.372, "step": 9600 }, { "epoch": 100.0, "step": 9600, "total_flos": 4293597283743744.0, "train_loss": 0.04076442163437605, "train_runtime": 503.1696, "train_samples_per_second": 304.271, "train_steps_per_second": 19.079 } ], "logging_steps": 500, "max_steps": 9600, "num_input_tokens_seen": 0, "num_train_epochs": 100, "save_steps": 500, "total_flos": 4293597283743744.0, "train_batch_size": 16, "trial_name": null, "trial_params": null }