diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,3130 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 100.0, + "eval_steps": 500, + "global_step": 9600, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 1.0, + "grad_norm": 1.0622260570526123, + "learning_rate": 4.9500000000000004e-05, + "loss": 0.8931, + "step": 96 + }, + { + "epoch": 1.0, + "eval_LOCATION_f1": 0.01694915254237288, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.5, + "eval_LOCATION_recall": 0.008620689655172414, + "eval_ORGANIZATION_f1": 0.24025974025974026, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.24666666666666667, + "eval_ORGANIZATION_recall": 0.23417721518987342, + "eval_PERSON_f1": 0.2660098522167488, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.34177215189873417, + "eval_PERSON_recall": 0.21774193548387097, + "eval_loss": 0.402089387178421, + "eval_overall_accuracy": 0.8597309909415317, + "eval_overall_f1": 0.20667726550079493, + "eval_overall_precision": 0.2813852813852814, + "eval_overall_recall": 0.16331658291457288, + "eval_runtime": 0.2477, + "eval_samples_per_second": 686.279, + "eval_steps_per_second": 12.111, + "step": 96 + }, + { + "epoch": 2.0, + "grad_norm": 1.0000041723251343, + "learning_rate": 4.9e-05, + "loss": 0.3656, + "step": 192 + }, + { + "epoch": 2.0, + "eval_LOCATION_f1": 0.4267782426778242, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.4146341463414634, + "eval_LOCATION_recall": 0.4396551724137931, + "eval_ORGANIZATION_f1": 0.5901639344262295, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.6122448979591837, + "eval_ORGANIZATION_recall": 0.569620253164557, + "eval_PERSON_f1": 0.5222929936305734, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.43157894736842106, + "eval_PERSON_recall": 0.6612903225806451, + "eval_loss": 0.21696880459785461, + "eval_overall_accuracy": 0.9264342574800988, + "eval_overall_f1": 0.5198135198135198, + "eval_overall_precision": 0.48478260869565215, + "eval_overall_recall": 0.5603015075376885, + "eval_runtime": 0.2423, + "eval_samples_per_second": 701.523, + "eval_steps_per_second": 12.38, + "step": 192 + }, + { + "epoch": 3.0, + "grad_norm": 0.8752551674842834, + "learning_rate": 4.85e-05, + "loss": 0.2175, + "step": 288 + }, + { + "epoch": 3.0, + "eval_LOCATION_f1": 0.7214611872146118, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.7669902912621359, + "eval_LOCATION_recall": 0.6810344827586207, + "eval_ORGANIZATION_f1": 0.7411764705882353, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.6923076923076923, + "eval_ORGANIZATION_recall": 0.7974683544303798, + "eval_PERSON_f1": 0.9416342412451362, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9097744360902256, + "eval_PERSON_recall": 0.9758064516129032, + "eval_loss": 0.11590560525655746, + "eval_overall_accuracy": 0.9648641229755696, + "eval_overall_f1": 0.7990196078431372, + "eval_overall_precision": 0.7799043062200957, + "eval_overall_recall": 0.8190954773869347, + "eval_runtime": 0.2421, + "eval_samples_per_second": 702.326, + "eval_steps_per_second": 12.394, + "step": 288 + }, + { + "epoch": 4.0, + "grad_norm": 1.105630874633789, + "learning_rate": 4.8e-05, + "loss": 0.152, + "step": 384 + }, + { + "epoch": 4.0, + "eval_LOCATION_f1": 0.8421052631578948, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.7938931297709924, + "eval_LOCATION_recall": 0.896551724137931, + "eval_ORGANIZATION_f1": 0.812121212121212, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.7790697674418605, + "eval_ORGANIZATION_recall": 0.8481012658227848, + "eval_PERSON_f1": 0.9647058823529411, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9389312977099237, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.08956436812877655, + "eval_overall_accuracy": 0.9706286027998902, + "eval_overall_f1": 0.8677884615384615, + "eval_overall_precision": 0.8317972350230415, + "eval_overall_recall": 0.907035175879397, + "eval_runtime": 0.243, + "eval_samples_per_second": 699.575, + "eval_steps_per_second": 12.345, + "step": 384 + }, + { + "epoch": 5.0, + "grad_norm": 0.8573193550109863, + "learning_rate": 4.75e-05, + "loss": 0.1153, + "step": 480 + }, + { + "epoch": 5.0, + "eval_LOCATION_f1": 0.8869565217391304, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.8947368421052632, + "eval_LOCATION_recall": 0.8793103448275862, + "eval_ORGANIZATION_f1": 0.8492307692307692, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.8263473053892215, + "eval_ORGANIZATION_recall": 0.8734177215189873, + "eval_PERSON_f1": 0.9721115537848605, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9606299212598425, + "eval_PERSON_recall": 0.9838709677419355, + "eval_loss": 0.06209466606378555, + "eval_overall_accuracy": 0.9777655778204777, + "eval_overall_f1": 0.8982630272952854, + "eval_overall_precision": 0.8872549019607843, + "eval_overall_recall": 0.9095477386934674, + "eval_runtime": 0.2426, + "eval_samples_per_second": 700.706, + "eval_steps_per_second": 12.365, + "step": 480 + }, + { + "epoch": 6.0, + "grad_norm": 2.2799108028411865, + "learning_rate": 4.7e-05, + "loss": 0.1017, + "step": 576 + }, + { + "epoch": 6.0, + "eval_LOCATION_f1": 0.8806584362139918, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.84251968503937, + "eval_LOCATION_recall": 0.9224137931034483, + "eval_ORGANIZATION_f1": 0.8827160493827162, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.8614457831325302, + "eval_ORGANIZATION_recall": 0.9050632911392406, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.04618193209171295, + "eval_overall_accuracy": 0.9846280538018117, + "eval_overall_f1": 0.9130966952264383, + "eval_overall_precision": 0.8902147971360382, + "eval_overall_recall": 0.9371859296482412, + "eval_runtime": 0.2426, + "eval_samples_per_second": 700.771, + "eval_steps_per_second": 12.367, + "step": 576 + }, + { + "epoch": 7.0, + "grad_norm": 0.5819811820983887, + "learning_rate": 4.6500000000000005e-05, + "loss": 0.0877, + "step": 672 + }, + { + "epoch": 7.0, + "eval_LOCATION_f1": 0.9170305676855894, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9292035398230089, + "eval_LOCATION_recall": 0.9051724137931034, + "eval_ORGANIZATION_f1": 0.9164086687306501, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.896969696969697, + "eval_ORGANIZATION_recall": 0.9367088607594937, + "eval_PERSON_f1": 0.9879518072289156, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.984, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.04141335189342499, + "eval_overall_accuracy": 0.9857260499588252, + "eval_overall_f1": 0.9388264669163546, + "eval_overall_precision": 0.9330024813895782, + "eval_overall_recall": 0.9447236180904522, + "eval_runtime": 0.2425, + "eval_samples_per_second": 701.0, + "eval_steps_per_second": 12.371, + "step": 672 + }, + { + "epoch": 8.0, + "grad_norm": 1.0621719360351562, + "learning_rate": 4.600000000000001e-05, + "loss": 0.0772, + "step": 768 + }, + { + "epoch": 8.0, + "eval_LOCATION_f1": 0.9152542372881356, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9, + "eval_LOCATION_recall": 0.9310344827586207, + "eval_ORGANIZATION_f1": 0.91875, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9074074074074074, + "eval_ORGANIZATION_recall": 0.930379746835443, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.03698663040995598, + "eval_overall_accuracy": 0.9873730441943454, + "eval_overall_f1": 0.9379652605459057, + "eval_overall_precision": 0.9264705882352942, + "eval_overall_recall": 0.949748743718593, + "eval_runtime": 0.2428, + "eval_samples_per_second": 700.264, + "eval_steps_per_second": 12.358, + "step": 768 + }, + { + "epoch": 9.0, + "grad_norm": 0.5991101861000061, + "learning_rate": 4.55e-05, + "loss": 0.0747, + "step": 864 + }, + { + "epoch": 9.0, + "eval_LOCATION_f1": 0.9288702928870294, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9024390243902439, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9345794392523364, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9202453987730062, + "eval_ORGANIZATION_recall": 0.9493670886075949, + "eval_PERSON_f1": 0.9879518072289156, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.984, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.04177405312657356, + "eval_overall_accuracy": 0.9860005489980785, + "eval_overall_f1": 0.9493201483312732, + "eval_overall_precision": 0.9343065693430657, + "eval_overall_recall": 0.964824120603015, + "eval_runtime": 0.2423, + "eval_samples_per_second": 701.484, + "eval_steps_per_second": 12.379, + "step": 864 + }, + { + "epoch": 10.0, + "grad_norm": 0.7477170825004578, + "learning_rate": 4.5e-05, + "loss": 0.0712, + "step": 960 + }, + { + "epoch": 10.0, + "eval_LOCATION_f1": 0.9268292682926829, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.8769230769230769, + "eval_LOCATION_recall": 0.9827586206896551, + "eval_ORGANIZATION_f1": 0.9329073482428115, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9419354838709677, + "eval_ORGANIZATION_recall": 0.9240506329113924, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.04179945960640907, + "eval_overall_accuracy": 0.9851770518803185, + "eval_overall_f1": 0.9468479604449939, + "eval_overall_precision": 0.9318734793187348, + "eval_overall_recall": 0.9623115577889447, + "eval_runtime": 0.2429, + "eval_samples_per_second": 699.957, + "eval_steps_per_second": 12.352, + "step": 960 + }, + { + "epoch": 11.0, + "grad_norm": 0.4425092041492462, + "learning_rate": 4.4500000000000004e-05, + "loss": 0.0645, + "step": 1056 + }, + { + "epoch": 11.0, + "eval_LOCATION_f1": 0.9191489361702128, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.907563025210084, + "eval_LOCATION_recall": 0.9310344827586207, + "eval_ORGANIZATION_f1": 0.9341692789968652, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9254658385093167, + "eval_ORGANIZATION_recall": 0.9430379746835443, + "eval_PERSON_f1": 0.9879518072289156, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.984, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.034665558487176895, + "eval_overall_accuracy": 0.9884710403513588, + "eval_overall_f1": 0.946450809464508, + "eval_overall_precision": 0.9382716049382716, + "eval_overall_recall": 0.9547738693467337, + "eval_runtime": 0.2429, + "eval_samples_per_second": 699.774, + "eval_steps_per_second": 12.349, + "step": 1056 + }, + { + "epoch": 12.0, + "grad_norm": 0.994752824306488, + "learning_rate": 4.4000000000000006e-05, + "loss": 0.0594, + "step": 1152 + }, + { + "epoch": 12.0, + "eval_LOCATION_f1": 0.923076923076923, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9152542372881356, + "eval_LOCATION_recall": 0.9310344827586207, + "eval_ORGANIZATION_f1": 0.9164086687306501, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.896969696969697, + "eval_ORGANIZATION_recall": 0.9367088607594937, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.03453850373625755, + "eval_overall_accuracy": 0.9876475432335987, + "eval_overall_f1": 0.9392812887236679, + "eval_overall_precision": 0.9266503667481663, + "eval_overall_recall": 0.9522613065326633, + "eval_runtime": 0.2433, + "eval_samples_per_second": 698.803, + "eval_steps_per_second": 12.332, + "step": 1152 + }, + { + "epoch": 13.0, + "grad_norm": 0.3863960802555084, + "learning_rate": 4.35e-05, + "loss": 0.0584, + "step": 1248 + }, + { + "epoch": 13.0, + "eval_LOCATION_f1": 0.927038626609442, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9230769230769231, + "eval_LOCATION_recall": 0.9310344827586207, + "eval_ORGANIZATION_f1": 0.9496855345911951, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.94375, + "eval_ORGANIZATION_recall": 0.9556962025316456, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.030687231570482254, + "eval_overall_accuracy": 0.9906670326653857, + "eval_overall_f1": 0.9538077403245941, + "eval_overall_precision": 0.9478908188585607, + "eval_overall_recall": 0.9597989949748744, + "eval_runtime": 0.2423, + "eval_samples_per_second": 701.612, + "eval_steps_per_second": 12.381, + "step": 1248 + }, + { + "epoch": 14.0, + "grad_norm": 0.7108584642410278, + "learning_rate": 4.3e-05, + "loss": 0.0533, + "step": 1344 + }, + { + "epoch": 14.0, + "eval_LOCATION_f1": 0.9276595744680851, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9159663865546218, + "eval_LOCATION_recall": 0.9396551724137931, + "eval_ORGANIZATION_f1": 0.9245283018867925, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.91875, + "eval_ORGANIZATION_recall": 0.930379746835443, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.03466002270579338, + "eval_overall_accuracy": 0.9879220422728521, + "eval_overall_f1": 0.9439601494396015, + "eval_overall_precision": 0.9358024691358025, + "eval_overall_recall": 0.9522613065326633, + "eval_runtime": 0.245, + "eval_samples_per_second": 694.012, + "eval_steps_per_second": 12.247, + "step": 1344 + }, + { + "epoch": 15.0, + "grad_norm": 0.4726468324661255, + "learning_rate": 4.25e-05, + "loss": 0.051, + "step": 1440 + }, + { + "epoch": 15.0, + "eval_LOCATION_f1": 0.9367088607594937, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9173553719008265, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9337539432176657, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9308176100628931, + "eval_ORGANIZATION_recall": 0.9367088607594937, + "eval_PERSON_f1": 0.9879518072289156, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.984, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.03434712067246437, + "eval_overall_accuracy": 0.9890200384298655, + "eval_overall_f1": 0.9514321295143213, + "eval_overall_precision": 0.9432098765432099, + "eval_overall_recall": 0.9597989949748744, + "eval_runtime": 0.2429, + "eval_samples_per_second": 699.91, + "eval_steps_per_second": 12.351, + "step": 1440 + }, + { + "epoch": 16.0, + "grad_norm": 0.5781874060630798, + "learning_rate": 4.2e-05, + "loss": 0.0498, + "step": 1536 + }, + { + "epoch": 16.0, + "eval_LOCATION_f1": 0.9243697478991596, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9016393442622951, + "eval_LOCATION_recall": 0.9482758620689655, + "eval_ORGANIZATION_f1": 0.9196141479099678, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.934640522875817, + "eval_ORGANIZATION_recall": 0.9050632911392406, + "eval_PERSON_f1": 0.9800796812749005, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.968503937007874, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.03455718606710434, + "eval_overall_accuracy": 0.9884710403513588, + "eval_overall_f1": 0.94, + "eval_overall_precision": 0.9353233830845771, + "eval_overall_recall": 0.9447236180904522, + "eval_runtime": 0.2432, + "eval_samples_per_second": 698.89, + "eval_steps_per_second": 12.333, + "step": 1536 + }, + { + "epoch": 17.0, + "grad_norm": 0.1878691464662552, + "learning_rate": 4.15e-05, + "loss": 0.0452, + "step": 1632 + }, + { + "epoch": 17.0, + "eval_LOCATION_f1": 0.925, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.8951612903225806, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9171974522292994, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9230769230769231, + "eval_ORGANIZATION_recall": 0.9113924050632911, + "eval_PERSON_f1": 0.9879518072289156, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.984, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.035126231610774994, + "eval_overall_accuracy": 0.987098545155092, + "eval_overall_f1": 0.9414694894146949, + "eval_overall_precision": 0.9333333333333333, + "eval_overall_recall": 0.949748743718593, + "eval_runtime": 0.2425, + "eval_samples_per_second": 700.995, + "eval_steps_per_second": 12.37, + "step": 1632 + }, + { + "epoch": 18.0, + "grad_norm": 0.7006422877311707, + "learning_rate": 4.1e-05, + "loss": 0.0437, + "step": 1728 + }, + { + "epoch": 18.0, + "eval_LOCATION_f1": 0.9282700421940928, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9090909090909091, + "eval_LOCATION_recall": 0.9482758620689655, + "eval_ORGANIZATION_f1": 0.9433962264150944, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9375, + "eval_ORGANIZATION_recall": 0.9493670886075949, + "eval_PERSON_f1": 0.9879518072289156, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.984, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.035111382603645325, + "eval_overall_accuracy": 0.9887455393906122, + "eval_overall_f1": 0.9527363184079602, + "eval_overall_precision": 0.9433497536945813, + "eval_overall_recall": 0.9623115577889447, + "eval_runtime": 0.2425, + "eval_samples_per_second": 700.948, + "eval_steps_per_second": 12.37, + "step": 1728 + }, + { + "epoch": 19.0, + "grad_norm": 0.6293537616729736, + "learning_rate": 4.05e-05, + "loss": 0.0419, + "step": 1824 + }, + { + "epoch": 19.0, + "eval_LOCATION_f1": 0.9115044247787611, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9363636363636364, + "eval_LOCATION_recall": 0.8879310344827587, + "eval_ORGANIZATION_f1": 0.9375000000000001, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9259259259259259, + "eval_ORGANIZATION_recall": 0.9493670886075949, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.03315844014286995, + "eval_overall_accuracy": 0.9890200384298655, + "eval_overall_f1": 0.9447236180904522, + "eval_overall_precision": 0.9447236180904522, + "eval_overall_recall": 0.9447236180904522, + "eval_runtime": 0.2423, + "eval_samples_per_second": 701.628, + "eval_steps_per_second": 12.382, + "step": 1824 + }, + { + "epoch": 20.0, + "grad_norm": 0.43634268641471863, + "learning_rate": 4e-05, + "loss": 0.0409, + "step": 1920 + }, + { + "epoch": 20.0, + "eval_LOCATION_f1": 0.9310344827586207, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9310344827586207, + "eval_LOCATION_recall": 0.9310344827586207, + "eval_ORGANIZATION_f1": 0.9254658385093167, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9085365853658537, + "eval_ORGANIZATION_recall": 0.9430379746835443, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.035573337227106094, + "eval_overall_accuracy": 0.9890200384298655, + "eval_overall_f1": 0.945273631840796, + "eval_overall_precision": 0.9359605911330049, + "eval_overall_recall": 0.9547738693467337, + "eval_runtime": 0.2427, + "eval_samples_per_second": 700.581, + "eval_steps_per_second": 12.363, + "step": 1920 + }, + { + "epoch": 21.0, + "grad_norm": 1.104005217552185, + "learning_rate": 3.9500000000000005e-05, + "loss": 0.0403, + "step": 2016 + }, + { + "epoch": 21.0, + "eval_LOCATION_f1": 0.925, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.8951612903225806, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9294871794871796, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9415584415584416, + "eval_ORGANIZATION_recall": 0.9177215189873418, + "eval_PERSON_f1": 0.9879518072289156, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.984, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.02913746051490307, + "eval_overall_accuracy": 0.9890200384298655, + "eval_overall_f1": 0.9463171036204745, + "eval_overall_precision": 0.9404466501240695, + "eval_overall_recall": 0.9522613065326633, + "eval_runtime": 0.2423, + "eval_samples_per_second": 701.518, + "eval_steps_per_second": 12.38, + "step": 2016 + }, + { + "epoch": 22.0, + "grad_norm": 0.9109427332878113, + "learning_rate": 3.9000000000000006e-05, + "loss": 0.0368, + "step": 2112 + }, + { + "epoch": 22.0, + "eval_LOCATION_f1": 0.9304347826086956, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9385964912280702, + "eval_LOCATION_recall": 0.9224137931034483, + "eval_ORGANIZATION_f1": 0.9337539432176657, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9308176100628931, + "eval_ORGANIZATION_recall": 0.9367088607594937, + "eval_PERSON_f1": 0.9800796812749005, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.968503937007874, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.03580503910779953, + "eval_overall_accuracy": 0.9895690365083722, + "eval_overall_f1": 0.9473684210526316, + "eval_overall_precision": 0.945, + "eval_overall_recall": 0.949748743718593, + "eval_runtime": 0.2428, + "eval_samples_per_second": 700.269, + "eval_steps_per_second": 12.358, + "step": 2112 + }, + { + "epoch": 23.0, + "grad_norm": 0.4533730745315552, + "learning_rate": 3.85e-05, + "loss": 0.0402, + "step": 2208 + }, + { + "epoch": 23.0, + "eval_LOCATION_f1": 0.9531914893617022, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9411764705882353, + "eval_LOCATION_recall": 0.9655172413793104, + "eval_ORGANIZATION_f1": 0.9337539432176657, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9308176100628931, + "eval_ORGANIZATION_recall": 0.9367088607594937, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.02975594624876976, + "eval_overall_accuracy": 0.9903925336261323, + "eval_overall_f1": 0.9551122194513715, + "eval_overall_precision": 0.948019801980198, + "eval_overall_recall": 0.9623115577889447, + "eval_runtime": 0.2418, + "eval_samples_per_second": 703.141, + "eval_steps_per_second": 12.408, + "step": 2208 + }, + { + "epoch": 24.0, + "grad_norm": 0.4602113962173462, + "learning_rate": 3.8e-05, + "loss": 0.0353, + "step": 2304 + }, + { + "epoch": 24.0, + "eval_LOCATION_f1": 0.9406779661016949, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.925, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9363057324840764, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9423076923076923, + "eval_ORGANIZATION_recall": 0.930379746835443, + "eval_PERSON_f1": 0.9879518072289156, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.984, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.03227541968226433, + "eval_overall_accuracy": 0.9895690365083722, + "eval_overall_f1": 0.9536921151439299, + "eval_overall_precision": 0.9501246882793017, + "eval_overall_recall": 0.957286432160804, + "eval_runtime": 0.2439, + "eval_samples_per_second": 696.954, + "eval_steps_per_second": 12.299, + "step": 2304 + }, + { + "epoch": 25.0, + "grad_norm": 0.7048800587654114, + "learning_rate": 3.7500000000000003e-05, + "loss": 0.0332, + "step": 2400 + }, + { + "epoch": 25.0, + "eval_LOCATION_f1": 0.9456066945606694, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9186991869918699, + "eval_LOCATION_recall": 0.9741379310344828, + "eval_ORGANIZATION_f1": 0.9003215434083601, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9150326797385621, + "eval_ORGANIZATION_recall": 0.8860759493670886, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.03731263801455498, + "eval_overall_accuracy": 0.9887455393906122, + "eval_overall_f1": 0.94, + "eval_overall_precision": 0.9353233830845771, + "eval_overall_recall": 0.9447236180904522, + "eval_runtime": 0.2428, + "eval_samples_per_second": 700.288, + "eval_steps_per_second": 12.358, + "step": 2400 + }, + { + "epoch": 26.0, + "grad_norm": 0.6570234894752502, + "learning_rate": 3.7e-05, + "loss": 0.0343, + "step": 2496 + }, + { + "epoch": 26.0, + "eval_LOCATION_f1": 0.9406779661016949, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.925, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9211356466876972, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9182389937106918, + "eval_ORGANIZATION_recall": 0.9240506329113924, + "eval_PERSON_f1": 0.9879518072289156, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.984, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.040523938834667206, + "eval_overall_accuracy": 0.9884710403513588, + "eval_overall_f1": 0.9476309226932669, + "eval_overall_precision": 0.9405940594059405, + "eval_overall_recall": 0.9547738693467337, + "eval_runtime": 0.2423, + "eval_samples_per_second": 701.468, + "eval_steps_per_second": 12.379, + "step": 2496 + }, + { + "epoch": 27.0, + "grad_norm": 0.9857751131057739, + "learning_rate": 3.65e-05, + "loss": 0.0342, + "step": 2592 + }, + { + "epoch": 27.0, + "eval_LOCATION_f1": 0.9406779661016949, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.925, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9363057324840764, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9423076923076923, + "eval_ORGANIZATION_recall": 0.930379746835443, + "eval_PERSON_f1": 0.9800796812749005, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.968503937007874, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.03457554057240486, + "eval_overall_accuracy": 0.9887455393906122, + "eval_overall_f1": 0.951310861423221, + "eval_overall_precision": 0.9454094292803971, + "eval_overall_recall": 0.957286432160804, + "eval_runtime": 0.2421, + "eval_samples_per_second": 702.06, + "eval_steps_per_second": 12.389, + "step": 2592 + }, + { + "epoch": 28.0, + "grad_norm": 0.46330365538597107, + "learning_rate": 3.6e-05, + "loss": 0.032, + "step": 2688 + }, + { + "epoch": 28.0, + "eval_LOCATION_f1": 0.923076923076923, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9152542372881356, + "eval_LOCATION_recall": 0.9310344827586207, + "eval_ORGANIZATION_f1": 0.9299363057324842, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9358974358974359, + "eval_ORGANIZATION_recall": 0.9240506329113924, + "eval_PERSON_f1": 0.9800796812749005, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.968503937007874, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.04411082714796066, + "eval_overall_accuracy": 0.987098545155092, + "eval_overall_f1": 0.9436795994993743, + "eval_overall_precision": 0.940149625935162, + "eval_overall_recall": 0.9472361809045227, + "eval_runtime": 0.2418, + "eval_samples_per_second": 703.003, + "eval_steps_per_second": 12.406, + "step": 2688 + }, + { + "epoch": 29.0, + "grad_norm": 0.4757544696331024, + "learning_rate": 3.55e-05, + "loss": 0.0275, + "step": 2784 + }, + { + "epoch": 29.0, + "eval_LOCATION_f1": 0.9396551724137931, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9396551724137931, + "eval_LOCATION_recall": 0.9396551724137931, + "eval_ORGANIZATION_f1": 0.9221183800623053, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9079754601226994, + "eval_ORGANIZATION_recall": 0.9367088607594937, + "eval_PERSON_f1": 0.9879518072289156, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.984, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.04470400512218475, + "eval_overall_accuracy": 0.9876475432335987, + "eval_overall_f1": 0.9476309226932669, + "eval_overall_precision": 0.9405940594059405, + "eval_overall_recall": 0.9547738693467337, + "eval_runtime": 0.242, + "eval_samples_per_second": 702.55, + "eval_steps_per_second": 12.398, + "step": 2784 + }, + { + "epoch": 30.0, + "grad_norm": 1.0357615947723389, + "learning_rate": 3.5e-05, + "loss": 0.0273, + "step": 2880 + }, + { + "epoch": 30.0, + "eval_LOCATION_f1": 0.9304347826086956, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9385964912280702, + "eval_LOCATION_recall": 0.9224137931034483, + "eval_ORGANIZATION_f1": 0.9316770186335404, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9146341463414634, + "eval_ORGANIZATION_recall": 0.9493670886075949, + "eval_PERSON_f1": 0.9879518072289156, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.984, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.043819691985845566, + "eval_overall_accuracy": 0.9884710403513588, + "eval_overall_f1": 0.9488139825218478, + "eval_overall_precision": 0.9429280397022333, + "eval_overall_recall": 0.9547738693467337, + "eval_runtime": 0.2421, + "eval_samples_per_second": 702.271, + "eval_steps_per_second": 12.393, + "step": 2880 + }, + { + "epoch": 31.0, + "grad_norm": 0.5754586458206177, + "learning_rate": 3.45e-05, + "loss": 0.0287, + "step": 2976 + }, + { + "epoch": 31.0, + "eval_LOCATION_f1": 0.9411764705882353, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9180327868852459, + "eval_LOCATION_recall": 0.9655172413793104, + "eval_ORGANIZATION_f1": 0.9290322580645162, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9473684210526315, + "eval_ORGANIZATION_recall": 0.9113924050632911, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.035712841898202896, + "eval_overall_accuracy": 0.990118034586879, + "eval_overall_f1": 0.9498746867167919, + "eval_overall_precision": 0.9475, + "eval_overall_recall": 0.9522613065326633, + "eval_runtime": 0.242, + "eval_samples_per_second": 702.469, + "eval_steps_per_second": 12.397, + "step": 2976 + }, + { + "epoch": 32.0, + "grad_norm": 0.4603827893733978, + "learning_rate": 3.4000000000000007e-05, + "loss": 0.0274, + "step": 3072 + }, + { + "epoch": 32.0, + "eval_LOCATION_f1": 0.9288702928870294, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9024390243902439, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9131832797427653, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9281045751633987, + "eval_ORGANIZATION_recall": 0.8987341772151899, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.04034664109349251, + "eval_overall_accuracy": 0.9881965413121054, + "eval_overall_f1": 0.94, + "eval_overall_precision": 0.9353233830845771, + "eval_overall_recall": 0.9447236180904522, + "eval_runtime": 0.2418, + "eval_samples_per_second": 703.177, + "eval_steps_per_second": 12.409, + "step": 3072 + }, + { + "epoch": 33.0, + "grad_norm": 0.4669646620750427, + "learning_rate": 3.35e-05, + "loss": 0.0284, + "step": 3168 + }, + { + "epoch": 33.0, + "eval_LOCATION_f1": 0.9327731092436975, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9098360655737705, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9196141479099678, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.934640522875817, + "eval_ORGANIZATION_recall": 0.9050632911392406, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.04073726758360863, + "eval_overall_accuracy": 0.9879220422728521, + "eval_overall_f1": 0.9436795994993743, + "eval_overall_precision": 0.940149625935162, + "eval_overall_recall": 0.9472361809045227, + "eval_runtime": 0.2426, + "eval_samples_per_second": 700.664, + "eval_steps_per_second": 12.365, + "step": 3168 + }, + { + "epoch": 34.0, + "grad_norm": 0.14242352545261383, + "learning_rate": 3.3e-05, + "loss": 0.0269, + "step": 3264 + }, + { + "epoch": 34.0, + "eval_LOCATION_f1": 0.9406779661016949, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.925, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9312499999999999, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9197530864197531, + "eval_ORGANIZATION_recall": 0.9430379746835443, + "eval_PERSON_f1": 0.9879518072289156, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.984, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.04001469165086746, + "eval_overall_accuracy": 0.9895690365083722, + "eval_overall_f1": 0.9515527950310558, + "eval_overall_precision": 0.941031941031941, + "eval_overall_recall": 0.9623115577889447, + "eval_runtime": 0.2432, + "eval_samples_per_second": 698.955, + "eval_steps_per_second": 12.334, + "step": 3264 + }, + { + "epoch": 35.0, + "grad_norm": 0.5518023371696472, + "learning_rate": 3.2500000000000004e-05, + "loss": 0.0245, + "step": 3360 + }, + { + "epoch": 35.0, + "eval_LOCATION_f1": 0.935064935064935, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9391304347826087, + "eval_LOCATION_recall": 0.9310344827586207, + "eval_ORGANIZATION_f1": 0.9226006191950465, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9030303030303031, + "eval_ORGANIZATION_recall": 0.9430379746835443, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.03874511644244194, + "eval_overall_accuracy": 0.9884710403513588, + "eval_overall_f1": 0.945273631840796, + "eval_overall_precision": 0.9359605911330049, + "eval_overall_recall": 0.9547738693467337, + "eval_runtime": 0.2431, + "eval_samples_per_second": 699.42, + "eval_steps_per_second": 12.343, + "step": 3360 + }, + { + "epoch": 36.0, + "grad_norm": 1.2177473306655884, + "learning_rate": 3.2000000000000005e-05, + "loss": 0.0251, + "step": 3456 + }, + { + "epoch": 36.0, + "eval_LOCATION_f1": 0.9406779661016949, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.925, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9308176100628932, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.925, + "eval_ORGANIZATION_recall": 0.9367088607594937, + "eval_PERSON_f1": 0.9879518072289156, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.984, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.03678901121020317, + "eval_overall_accuracy": 0.9895690365083722, + "eval_overall_f1": 0.9514321295143213, + "eval_overall_precision": 0.9432098765432099, + "eval_overall_recall": 0.9597989949748744, + "eval_runtime": 0.2423, + "eval_samples_per_second": 701.694, + "eval_steps_per_second": 12.383, + "step": 3456 + }, + { + "epoch": 37.0, + "grad_norm": 1.4173684120178223, + "learning_rate": 3.15e-05, + "loss": 0.0243, + "step": 3552 + }, + { + "epoch": 37.0, + "eval_LOCATION_f1": 0.9356223175965666, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9316239316239316, + "eval_LOCATION_recall": 0.9396551724137931, + "eval_ORGANIZATION_f1": 0.9333333333333332, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9363057324840764, + "eval_ORGANIZATION_recall": 0.930379746835443, + "eval_PERSON_f1": 0.9800796812749005, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.968503937007874, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.03889763355255127, + "eval_overall_accuracy": 0.9895690365083722, + "eval_overall_f1": 0.9486858573216519, + "eval_overall_precision": 0.9451371571072319, + "eval_overall_recall": 0.9522613065326633, + "eval_runtime": 0.2444, + "eval_samples_per_second": 695.549, + "eval_steps_per_second": 12.274, + "step": 3552 + }, + { + "epoch": 38.0, + "grad_norm": 0.6296694874763489, + "learning_rate": 3.1e-05, + "loss": 0.0242, + "step": 3648 + }, + { + "epoch": 38.0, + "eval_LOCATION_f1": 0.9113924050632911, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.8925619834710744, + "eval_LOCATION_recall": 0.9310344827586207, + "eval_ORGANIZATION_f1": 0.9235668789808917, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9294871794871795, + "eval_ORGANIZATION_recall": 0.9177215189873418, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.04012976959347725, + "eval_overall_accuracy": 0.9879220422728521, + "eval_overall_f1": 0.9388264669163546, + "eval_overall_precision": 0.9330024813895782, + "eval_overall_recall": 0.9447236180904522, + "eval_runtime": 0.2429, + "eval_samples_per_second": 699.989, + "eval_steps_per_second": 12.353, + "step": 3648 + }, + { + "epoch": 39.0, + "grad_norm": 0.07241743803024292, + "learning_rate": 3.05e-05, + "loss": 0.0244, + "step": 3744 + }, + { + "epoch": 39.0, + "eval_LOCATION_f1": 0.9406779661016949, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.925, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9329073482428115, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9419354838709677, + "eval_ORGANIZATION_recall": 0.9240506329113924, + "eval_PERSON_f1": 0.9800796812749005, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.968503937007874, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.04065397381782532, + "eval_overall_accuracy": 0.9876475432335987, + "eval_overall_f1": 0.95, + "eval_overall_precision": 0.945273631840796, + "eval_overall_recall": 0.9547738693467337, + "eval_runtime": 0.2421, + "eval_samples_per_second": 702.128, + "eval_steps_per_second": 12.39, + "step": 3744 + }, + { + "epoch": 40.0, + "grad_norm": 0.13085119426250458, + "learning_rate": 3e-05, + "loss": 0.0211, + "step": 3840 + }, + { + "epoch": 40.0, + "eval_LOCATION_f1": 0.9361702127659575, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9243697478991597, + "eval_LOCATION_recall": 0.9482758620689655, + "eval_ORGANIZATION_f1": 0.9375000000000001, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9259259259259259, + "eval_ORGANIZATION_recall": 0.9493670886075949, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.04333576187491417, + "eval_overall_accuracy": 0.9890200384298655, + "eval_overall_f1": 0.9515527950310558, + "eval_overall_precision": 0.941031941031941, + "eval_overall_recall": 0.9623115577889447, + "eval_runtime": 0.2428, + "eval_samples_per_second": 700.162, + "eval_steps_per_second": 12.356, + "step": 3840 + }, + { + "epoch": 41.0, + "grad_norm": 0.029861435294151306, + "learning_rate": 2.95e-05, + "loss": 0.0223, + "step": 3936 + }, + { + "epoch": 41.0, + "eval_LOCATION_f1": 0.944206008583691, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9401709401709402, + "eval_LOCATION_recall": 0.9482758620689655, + "eval_ORGANIZATION_f1": 0.9278996865203761, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9192546583850931, + "eval_ORGANIZATION_recall": 0.9367088607594937, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.03654933720827103, + "eval_overall_accuracy": 0.9892945374691189, + "eval_overall_f1": 0.9501246882793017, + "eval_overall_precision": 0.943069306930693, + "eval_overall_recall": 0.957286432160804, + "eval_runtime": 0.2424, + "eval_samples_per_second": 701.253, + "eval_steps_per_second": 12.375, + "step": 3936 + }, + { + "epoch": 42.0, + "grad_norm": 0.09470277279615402, + "learning_rate": 2.9e-05, + "loss": 0.0224, + "step": 4032 + }, + { + "epoch": 42.0, + "eval_LOCATION_f1": 0.94017094017094, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9322033898305084, + "eval_LOCATION_recall": 0.9482758620689655, + "eval_ORGANIZATION_f1": 0.9278996865203761, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9192546583850931, + "eval_ORGANIZATION_recall": 0.9367088607594937, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.039208512753248215, + "eval_overall_accuracy": 0.9895690365083722, + "eval_overall_f1": 0.9489414694894147, + "eval_overall_precision": 0.9407407407407408, + "eval_overall_recall": 0.957286432160804, + "eval_runtime": 0.2423, + "eval_samples_per_second": 701.592, + "eval_steps_per_second": 12.381, + "step": 4032 + }, + { + "epoch": 43.0, + "grad_norm": 0.29208576679229736, + "learning_rate": 2.8499999999999998e-05, + "loss": 0.0197, + "step": 4128 + }, + { + "epoch": 43.0, + "eval_LOCATION_f1": 0.9316239316239315, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.923728813559322, + "eval_LOCATION_recall": 0.9396551724137931, + "eval_ORGANIZATION_f1": 0.9274447949526813, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9245283018867925, + "eval_ORGANIZATION_recall": 0.930379746835443, + "eval_PERSON_f1": 0.9761904761904763, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9609375, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.03720787167549133, + "eval_overall_accuracy": 0.9890200384298655, + "eval_overall_f1": 0.9439601494396015, + "eval_overall_precision": 0.9358024691358025, + "eval_overall_recall": 0.9522613065326633, + "eval_runtime": 0.242, + "eval_samples_per_second": 702.453, + "eval_steps_per_second": 12.396, + "step": 4128 + }, + { + "epoch": 44.0, + "grad_norm": 0.3295332193374634, + "learning_rate": 2.8000000000000003e-05, + "loss": 0.022, + "step": 4224 + }, + { + "epoch": 44.0, + "eval_LOCATION_f1": 0.9446808510638298, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9327731092436975, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9177215189873418, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9177215189873418, + "eval_ORGANIZATION_recall": 0.9177215189873418, + "eval_PERSON_f1": 0.9800796812749005, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.968503937007874, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.04005124792456627, + "eval_overall_accuracy": 0.9884710403513588, + "eval_overall_f1": 0.9451371571072318, + "eval_overall_precision": 0.9381188118811881, + "eval_overall_recall": 0.9522613065326633, + "eval_runtime": 0.2427, + "eval_samples_per_second": 700.36, + "eval_steps_per_second": 12.359, + "step": 4224 + }, + { + "epoch": 45.0, + "grad_norm": 1.0696682929992676, + "learning_rate": 2.7500000000000004e-05, + "loss": 0.0192, + "step": 4320 + }, + { + "epoch": 45.0, + "eval_LOCATION_f1": 0.9406779661016949, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.925, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.926517571884984, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9354838709677419, + "eval_ORGANIZATION_recall": 0.9177215189873418, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.04148309305310249, + "eval_overall_accuracy": 0.9887455393906122, + "eval_overall_f1": 0.9486858573216519, + "eval_overall_precision": 0.9451371571072319, + "eval_overall_recall": 0.9522613065326633, + "eval_runtime": 0.2424, + "eval_samples_per_second": 701.317, + "eval_steps_per_second": 12.376, + "step": 4320 + }, + { + "epoch": 46.0, + "grad_norm": 0.5310882925987244, + "learning_rate": 2.7000000000000002e-05, + "loss": 0.0197, + "step": 4416 + }, + { + "epoch": 46.0, + "eval_LOCATION_f1": 0.9456066945606694, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9186991869918699, + "eval_LOCATION_recall": 0.9741379310344828, + "eval_ORGANIZATION_f1": 0.9274447949526813, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9245283018867925, + "eval_ORGANIZATION_recall": 0.930379746835443, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.03862782195210457, + "eval_overall_accuracy": 0.990118034586879, + "eval_overall_f1": 0.9503722084367245, + "eval_overall_precision": 0.9387254901960784, + "eval_overall_recall": 0.9623115577889447, + "eval_runtime": 0.2435, + "eval_samples_per_second": 698.028, + "eval_steps_per_second": 12.318, + "step": 4416 + }, + { + "epoch": 47.0, + "grad_norm": 0.36547964811325073, + "learning_rate": 2.6500000000000004e-05, + "loss": 0.02, + "step": 4512 + }, + { + "epoch": 47.0, + "eval_LOCATION_f1": 0.944206008583691, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9401709401709402, + "eval_LOCATION_recall": 0.9482758620689655, + "eval_ORGANIZATION_f1": 0.940809968847352, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9263803680981595, + "eval_ORGANIZATION_recall": 0.9556962025316456, + "eval_PERSON_f1": 0.9800796812749005, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.968503937007874, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.042170971632003784, + "eval_overall_accuracy": 0.9892945374691189, + "eval_overall_f1": 0.9540372670807453, + "eval_overall_precision": 0.9434889434889435, + "eval_overall_recall": 0.964824120603015, + "eval_runtime": 0.2438, + "eval_samples_per_second": 697.197, + "eval_steps_per_second": 12.303, + "step": 4512 + }, + { + "epoch": 48.0, + "grad_norm": 0.4364250600337982, + "learning_rate": 2.6000000000000002e-05, + "loss": 0.0192, + "step": 4608 + }, + { + "epoch": 48.0, + "eval_LOCATION_f1": 0.9411764705882353, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9180327868852459, + "eval_LOCATION_recall": 0.9655172413793104, + "eval_ORGANIZATION_f1": 0.923076923076923, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.935064935064935, + "eval_ORGANIZATION_recall": 0.9113924050632911, + "eval_PERSON_f1": 0.9879518072289156, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.984, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.03884365037083626, + "eval_overall_accuracy": 0.9879220422728521, + "eval_overall_f1": 0.9486858573216519, + "eval_overall_precision": 0.9451371571072319, + "eval_overall_recall": 0.9522613065326633, + "eval_runtime": 0.2413, + "eval_samples_per_second": 704.424, + "eval_steps_per_second": 12.431, + "step": 4608 + }, + { + "epoch": 49.0, + "grad_norm": 0.6926938891410828, + "learning_rate": 2.5500000000000003e-05, + "loss": 0.0182, + "step": 4704 + }, + { + "epoch": 49.0, + "eval_LOCATION_f1": 0.9535864978902953, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9338842975206612, + "eval_LOCATION_recall": 0.9741379310344828, + "eval_ORGANIZATION_f1": 0.9430379746835443, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9430379746835443, + "eval_ORGANIZATION_recall": 0.9430379746835443, + "eval_PERSON_f1": 0.9879518072289156, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.984, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.04192095994949341, + "eval_overall_accuracy": 0.9895690365083722, + "eval_overall_f1": 0.9600997506234414, + "eval_overall_precision": 0.9529702970297029, + "eval_overall_recall": 0.9673366834170855, + "eval_runtime": 0.2413, + "eval_samples_per_second": 704.587, + "eval_steps_per_second": 12.434, + "step": 4704 + }, + { + "epoch": 50.0, + "grad_norm": 0.5129674673080444, + "learning_rate": 2.5e-05, + "loss": 0.0182, + "step": 4800 + }, + { + "epoch": 50.0, + "eval_LOCATION_f1": 0.9491525423728815, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9333333333333333, + "eval_LOCATION_recall": 0.9655172413793104, + "eval_ORGANIZATION_f1": 0.9142857142857144, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9171974522292994, + "eval_ORGANIZATION_recall": 0.9113924050632911, + "eval_PERSON_f1": 0.9800796812749005, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.968503937007874, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.04355218634009361, + "eval_overall_accuracy": 0.9881965413121054, + "eval_overall_f1": 0.9451371571072318, + "eval_overall_precision": 0.9381188118811881, + "eval_overall_recall": 0.9522613065326633, + "eval_runtime": 0.2421, + "eval_samples_per_second": 702.06, + "eval_steps_per_second": 12.389, + "step": 4800 + }, + { + "epoch": 51.0, + "grad_norm": 0.3724958598613739, + "learning_rate": 2.45e-05, + "loss": 0.0196, + "step": 4896 + }, + { + "epoch": 51.0, + "eval_LOCATION_f1": 0.9367088607594937, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9173553719008265, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9294871794871796, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9415584415584416, + "eval_ORGANIZATION_recall": 0.9177215189873418, + "eval_PERSON_f1": 0.9761904761904763, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9609375, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.04640508443117142, + "eval_overall_accuracy": 0.9876475432335987, + "eval_overall_f1": 0.9463171036204745, + "eval_overall_precision": 0.9404466501240695, + "eval_overall_recall": 0.9522613065326633, + "eval_runtime": 0.2424, + "eval_samples_per_second": 701.373, + "eval_steps_per_second": 12.377, + "step": 4896 + }, + { + "epoch": 52.0, + "grad_norm": 0.4651976525783539, + "learning_rate": 2.4e-05, + "loss": 0.016, + "step": 4992 + }, + { + "epoch": 52.0, + "eval_LOCATION_f1": 0.9288702928870294, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9024390243902439, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.923076923076923, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.935064935064935, + "eval_ORGANIZATION_recall": 0.9113924050632911, + "eval_PERSON_f1": 0.9761904761904763, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9609375, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.04982294142246246, + "eval_overall_accuracy": 0.987098545155092, + "eval_overall_f1": 0.9414694894146949, + "eval_overall_precision": 0.9333333333333333, + "eval_overall_recall": 0.949748743718593, + "eval_runtime": 0.2422, + "eval_samples_per_second": 702.013, + "eval_steps_per_second": 12.388, + "step": 4992 + }, + { + "epoch": 53.0, + "grad_norm": 0.3692150413990021, + "learning_rate": 2.35e-05, + "loss": 0.0174, + "step": 5088 + }, + { + "epoch": 53.0, + "eval_LOCATION_f1": 0.944206008583691, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9401709401709402, + "eval_LOCATION_recall": 0.9482758620689655, + "eval_ORGANIZATION_f1": 0.9426751592356688, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9487179487179487, + "eval_ORGANIZATION_recall": 0.9367088607594937, + "eval_PERSON_f1": 0.9761904761904763, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9609375, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.047746025025844574, + "eval_overall_accuracy": 0.9887455393906122, + "eval_overall_f1": 0.9536921151439299, + "eval_overall_precision": 0.9501246882793017, + "eval_overall_recall": 0.957286432160804, + "eval_runtime": 0.2418, + "eval_samples_per_second": 703.203, + "eval_steps_per_second": 12.409, + "step": 5088 + }, + { + "epoch": 54.0, + "grad_norm": 2.322037935256958, + "learning_rate": 2.3000000000000003e-05, + "loss": 0.0156, + "step": 5184 + }, + { + "epoch": 54.0, + "eval_LOCATION_f1": 0.944206008583691, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9401709401709402, + "eval_LOCATION_recall": 0.9482758620689655, + "eval_ORGANIZATION_f1": 0.9363057324840764, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9423076923076923, + "eval_ORGANIZATION_recall": 0.930379746835443, + "eval_PERSON_f1": 0.9800796812749005, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.968503937007874, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.05073067173361778, + "eval_overall_accuracy": 0.9881965413121054, + "eval_overall_f1": 0.9523809523809523, + "eval_overall_precision": 0.95, + "eval_overall_recall": 0.9547738693467337, + "eval_runtime": 0.2418, + "eval_samples_per_second": 703.172, + "eval_steps_per_second": 12.409, + "step": 5184 + }, + { + "epoch": 55.0, + "grad_norm": 0.8182074427604675, + "learning_rate": 2.25e-05, + "loss": 0.0161, + "step": 5280 + }, + { + "epoch": 55.0, + "eval_LOCATION_f1": 0.944206008583691, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9401709401709402, + "eval_LOCATION_recall": 0.9482758620689655, + "eval_ORGANIZATION_f1": 0.9235668789808917, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9294871794871795, + "eval_ORGANIZATION_recall": 0.9177215189873418, + "eval_PERSON_f1": 0.9800796812749005, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.968503937007874, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.04936642944812775, + "eval_overall_accuracy": 0.9887455393906122, + "eval_overall_f1": 0.9473684210526316, + "eval_overall_precision": 0.945, + "eval_overall_recall": 0.949748743718593, + "eval_runtime": 0.2422, + "eval_samples_per_second": 701.981, + "eval_steps_per_second": 12.388, + "step": 5280 + }, + { + "epoch": 56.0, + "grad_norm": 0.47536519169807434, + "learning_rate": 2.2000000000000003e-05, + "loss": 0.0154, + "step": 5376 + }, + { + "epoch": 56.0, + "eval_LOCATION_f1": 0.9322033898305084, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9166666666666666, + "eval_LOCATION_recall": 0.9482758620689655, + "eval_ORGANIZATION_f1": 0.9177215189873418, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9177215189873418, + "eval_ORGANIZATION_recall": 0.9177215189873418, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.04633556678891182, + "eval_overall_accuracy": 0.9884710403513588, + "eval_overall_f1": 0.9426433915211971, + "eval_overall_precision": 0.9356435643564357, + "eval_overall_recall": 0.949748743718593, + "eval_runtime": 0.2421, + "eval_samples_per_second": 702.149, + "eval_steps_per_second": 12.391, + "step": 5376 + }, + { + "epoch": 57.0, + "grad_norm": 0.4734033942222595, + "learning_rate": 2.15e-05, + "loss": 0.0159, + "step": 5472 + }, + { + "epoch": 57.0, + "eval_LOCATION_f1": 0.9482758620689655, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9482758620689655, + "eval_LOCATION_recall": 0.9482758620689655, + "eval_ORGANIZATION_f1": 0.9245283018867925, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.91875, + "eval_ORGANIZATION_recall": 0.930379746835443, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.04754474759101868, + "eval_overall_accuracy": 0.9881965413121054, + "eval_overall_f1": 0.95, + "eval_overall_precision": 0.945273631840796, + "eval_overall_recall": 0.9547738693467337, + "eval_runtime": 0.2424, + "eval_samples_per_second": 701.32, + "eval_steps_per_second": 12.376, + "step": 5472 + }, + { + "epoch": 58.0, + "grad_norm": 0.09098278731107712, + "learning_rate": 2.1e-05, + "loss": 0.0159, + "step": 5568 + }, + { + "epoch": 58.0, + "eval_LOCATION_f1": 0.9327731092436975, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9098360655737705, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9260450160771704, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9411764705882353, + "eval_ORGANIZATION_recall": 0.9113924050632911, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.049943216145038605, + "eval_overall_accuracy": 0.9873730441943454, + "eval_overall_f1": 0.9461827284105131, + "eval_overall_precision": 0.942643391521197, + "eval_overall_recall": 0.949748743718593, + "eval_runtime": 0.2423, + "eval_samples_per_second": 701.712, + "eval_steps_per_second": 12.383, + "step": 5568 + }, + { + "epoch": 59.0, + "grad_norm": 0.28300827741622925, + "learning_rate": 2.05e-05, + "loss": 0.0154, + "step": 5664 + }, + { + "epoch": 59.0, + "eval_LOCATION_f1": 0.9406779661016949, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.925, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.926984126984127, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9299363057324841, + "eval_ORGANIZATION_recall": 0.9240506329113924, + "eval_PERSON_f1": 0.9800796812749005, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.968503937007874, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.04638950154185295, + "eval_overall_accuracy": 0.9881965413121054, + "eval_overall_f1": 0.9476309226932669, + "eval_overall_precision": 0.9405940594059405, + "eval_overall_recall": 0.9547738693467337, + "eval_runtime": 0.2422, + "eval_samples_per_second": 701.998, + "eval_steps_per_second": 12.388, + "step": 5664 + }, + { + "epoch": 60.0, + "grad_norm": 0.24135783314704895, + "learning_rate": 2e-05, + "loss": 0.0146, + "step": 5760 + }, + { + "epoch": 60.0, + "eval_LOCATION_f1": 0.9372384937238494, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9105691056910569, + "eval_LOCATION_recall": 0.9655172413793104, + "eval_ORGANIZATION_f1": 0.9396825396825397, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9426751592356688, + "eval_ORGANIZATION_recall": 0.9367088607594937, + "eval_PERSON_f1": 0.9800796812749005, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.968503937007874, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.05022583156824112, + "eval_overall_accuracy": 0.9881965413121054, + "eval_overall_f1": 0.9515527950310558, + "eval_overall_precision": 0.941031941031941, + "eval_overall_recall": 0.9623115577889447, + "eval_runtime": 0.2423, + "eval_samples_per_second": 701.667, + "eval_steps_per_second": 12.382, + "step": 5760 + }, + { + "epoch": 61.0, + "grad_norm": 0.48841485381126404, + "learning_rate": 1.9500000000000003e-05, + "loss": 0.0164, + "step": 5856 + }, + { + "epoch": 61.0, + "eval_LOCATION_f1": 0.9411764705882353, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9180327868852459, + "eval_LOCATION_recall": 0.9655172413793104, + "eval_ORGANIZATION_f1": 0.926984126984127, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9299363057324841, + "eval_ORGANIZATION_recall": 0.9240506329113924, + "eval_PERSON_f1": 0.9879518072289156, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.984, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.047981929033994675, + "eval_overall_accuracy": 0.9879220422728521, + "eval_overall_f1": 0.9501246882793017, + "eval_overall_precision": 0.943069306930693, + "eval_overall_recall": 0.957286432160804, + "eval_runtime": 0.2422, + "eval_samples_per_second": 701.864, + "eval_steps_per_second": 12.386, + "step": 5856 + }, + { + "epoch": 62.0, + "grad_norm": 0.623166024684906, + "learning_rate": 1.9e-05, + "loss": 0.0126, + "step": 5952 + }, + { + "epoch": 62.0, + "eval_LOCATION_f1": 0.925, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.8951612903225806, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9102564102564102, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.922077922077922, + "eval_ORGANIZATION_recall": 0.8987341772151899, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.05383405089378357, + "eval_overall_accuracy": 0.987098545155092, + "eval_overall_f1": 0.9376558603491272, + "eval_overall_precision": 0.9306930693069307, + "eval_overall_recall": 0.9447236180904522, + "eval_runtime": 0.242, + "eval_samples_per_second": 702.589, + "eval_steps_per_second": 12.399, + "step": 5952 + }, + { + "epoch": 63.0, + "grad_norm": 0.06195319816470146, + "learning_rate": 1.85e-05, + "loss": 0.0142, + "step": 6048 + }, + { + "epoch": 63.0, + "eval_LOCATION_f1": 0.9572649572649573, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9491525423728814, + "eval_LOCATION_recall": 0.9655172413793104, + "eval_ORGANIZATION_f1": 0.9206349206349206, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9235668789808917, + "eval_ORGANIZATION_recall": 0.9177215189873418, + "eval_PERSON_f1": 0.9879518072289156, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.984, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.050431687384843826, + "eval_overall_accuracy": 0.9887455393906122, + "eval_overall_f1": 0.9523809523809523, + "eval_overall_precision": 0.95, + "eval_overall_recall": 0.9547738693467337, + "eval_runtime": 0.2441, + "eval_samples_per_second": 696.509, + "eval_steps_per_second": 12.291, + "step": 6048 + }, + { + "epoch": 64.0, + "grad_norm": 0.38351964950561523, + "learning_rate": 1.8e-05, + "loss": 0.0131, + "step": 6144 + }, + { + "epoch": 64.0, + "eval_LOCATION_f1": 0.9568965517241379, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9568965517241379, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9463722397476341, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9433962264150944, + "eval_ORGANIZATION_recall": 0.9493670886075949, + "eval_PERSON_f1": 0.9800796812749005, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.968503937007874, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.04740133136510849, + "eval_overall_accuracy": 0.9890200384298655, + "eval_overall_f1": 0.96, + "eval_overall_precision": 0.9552238805970149, + "eval_overall_recall": 0.964824120603015, + "eval_runtime": 0.242, + "eval_samples_per_second": 702.471, + "eval_steps_per_second": 12.397, + "step": 6144 + }, + { + "epoch": 65.0, + "grad_norm": 0.42032256722450256, + "learning_rate": 1.75e-05, + "loss": 0.0144, + "step": 6240 + }, + { + "epoch": 65.0, + "eval_LOCATION_f1": 0.9451476793248945, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9256198347107438, + "eval_LOCATION_recall": 0.9655172413793104, + "eval_ORGANIZATION_f1": 0.926517571884984, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9354838709677419, + "eval_ORGANIZATION_recall": 0.9177215189873418, + "eval_PERSON_f1": 0.9799196787148594, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.976, + "eval_PERSON_recall": 0.9838709677419355, + "eval_loss": 0.05012889206409454, + "eval_overall_accuracy": 0.9876475432335987, + "eval_overall_f1": 0.9486858573216519, + "eval_overall_precision": 0.9451371571072319, + "eval_overall_recall": 0.9522613065326633, + "eval_runtime": 0.2428, + "eval_samples_per_second": 700.183, + "eval_steps_per_second": 12.356, + "step": 6240 + }, + { + "epoch": 66.0, + "grad_norm": 0.6347458362579346, + "learning_rate": 1.7000000000000003e-05, + "loss": 0.0135, + "step": 6336 + }, + { + "epoch": 66.0, + "eval_LOCATION_f1": 0.9446808510638298, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9327731092436975, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9240506329113924, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9240506329113924, + "eval_ORGANIZATION_recall": 0.9240506329113924, + "eval_PERSON_f1": 0.9800796812749005, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.968503937007874, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.05208972468972206, + "eval_overall_accuracy": 0.9876475432335987, + "eval_overall_f1": 0.9476309226932669, + "eval_overall_precision": 0.9405940594059405, + "eval_overall_recall": 0.9547738693467337, + "eval_runtime": 0.2429, + "eval_samples_per_second": 699.867, + "eval_steps_per_second": 12.351, + "step": 6336 + }, + { + "epoch": 67.0, + "grad_norm": 1.0222524404525757, + "learning_rate": 1.65e-05, + "loss": 0.0162, + "step": 6432 + }, + { + "epoch": 67.0, + "eval_LOCATION_f1": 0.9406779661016949, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.925, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9201277955271565, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9290322580645162, + "eval_ORGANIZATION_recall": 0.9113924050632911, + "eval_PERSON_f1": 0.9800796812749005, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.968503937007874, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.05340787023305893, + "eval_overall_accuracy": 0.9862750480373319, + "eval_overall_f1": 0.9450000000000001, + "eval_overall_precision": 0.9402985074626866, + "eval_overall_recall": 0.949748743718593, + "eval_runtime": 0.2417, + "eval_samples_per_second": 703.351, + "eval_steps_per_second": 12.412, + "step": 6432 + }, + { + "epoch": 68.0, + "grad_norm": 0.6841771006584167, + "learning_rate": 1.6000000000000003e-05, + "loss": 0.0136, + "step": 6528 + }, + { + "epoch": 68.0, + "eval_LOCATION_f1": 0.9406779661016949, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.925, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9363057324840764, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9423076923076923, + "eval_ORGANIZATION_recall": 0.930379746835443, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.05373825877904892, + "eval_overall_accuracy": 0.9881965413121054, + "eval_overall_f1": 0.9525, + "eval_overall_precision": 0.9477611940298507, + "eval_overall_recall": 0.957286432160804, + "eval_runtime": 0.2419, + "eval_samples_per_second": 702.784, + "eval_steps_per_second": 12.402, + "step": 6528 + }, + { + "epoch": 69.0, + "grad_norm": 1.1261268854141235, + "learning_rate": 1.55e-05, + "loss": 0.0138, + "step": 6624 + }, + { + "epoch": 69.0, + "eval_LOCATION_f1": 0.9361702127659575, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9243697478991597, + "eval_LOCATION_recall": 0.9482758620689655, + "eval_ORGANIZATION_f1": 0.9363057324840764, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9423076923076923, + "eval_ORGANIZATION_recall": 0.930379746835443, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.05131537467241287, + "eval_overall_accuracy": 0.9887455393906122, + "eval_overall_f1": 0.951188986232791, + "eval_overall_precision": 0.9476309226932669, + "eval_overall_recall": 0.9547738693467337, + "eval_runtime": 0.2421, + "eval_samples_per_second": 702.112, + "eval_steps_per_second": 12.39, + "step": 6624 + }, + { + "epoch": 70.0, + "grad_norm": 0.47885391116142273, + "learning_rate": 1.5e-05, + "loss": 0.0135, + "step": 6720 + }, + { + "epoch": 70.0, + "eval_LOCATION_f1": 0.9406779661016949, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.925, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.926984126984127, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9299363057324841, + "eval_ORGANIZATION_recall": 0.9240506329113924, + "eval_PERSON_f1": 0.9800796812749005, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.968503937007874, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.05541845038533211, + "eval_overall_accuracy": 0.987098545155092, + "eval_overall_f1": 0.9476309226932669, + "eval_overall_precision": 0.9405940594059405, + "eval_overall_recall": 0.9547738693467337, + "eval_runtime": 0.2426, + "eval_samples_per_second": 700.621, + "eval_steps_per_second": 12.364, + "step": 6720 + }, + { + "epoch": 71.0, + "grad_norm": 0.29839274287223816, + "learning_rate": 1.45e-05, + "loss": 0.0121, + "step": 6816 + }, + { + "epoch": 71.0, + "eval_LOCATION_f1": 0.9482758620689655, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9482758620689655, + "eval_LOCATION_recall": 0.9482758620689655, + "eval_ORGANIZATION_f1": 0.9341692789968652, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9254658385093167, + "eval_ORGANIZATION_recall": 0.9430379746835443, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.05237449333071709, + "eval_overall_accuracy": 0.9884710403513588, + "eval_overall_f1": 0.9538077403245941, + "eval_overall_precision": 0.9478908188585607, + "eval_overall_recall": 0.9597989949748744, + "eval_runtime": 0.2432, + "eval_samples_per_second": 698.886, + "eval_steps_per_second": 12.333, + "step": 6816 + }, + { + "epoch": 72.0, + "grad_norm": 1.4181568622589111, + "learning_rate": 1.4000000000000001e-05, + "loss": 0.0131, + "step": 6912 + }, + { + "epoch": 72.0, + "eval_LOCATION_f1": 0.9406779661016949, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.925, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9235668789808917, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9294871794871795, + "eval_ORGANIZATION_recall": 0.9177215189873418, + "eval_PERSON_f1": 0.9800796812749005, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.968503937007874, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.05246526002883911, + "eval_overall_accuracy": 0.9881965413121054, + "eval_overall_f1": 0.9463171036204745, + "eval_overall_precision": 0.9404466501240695, + "eval_overall_recall": 0.9522613065326633, + "eval_runtime": 0.2421, + "eval_samples_per_second": 702.097, + "eval_steps_per_second": 12.39, + "step": 6912 + }, + { + "epoch": 73.0, + "grad_norm": 0.5246819853782654, + "learning_rate": 1.3500000000000001e-05, + "loss": 0.0129, + "step": 7008 + }, + { + "epoch": 73.0, + "eval_LOCATION_f1": 0.9322033898305084, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9166666666666666, + "eval_LOCATION_recall": 0.9482758620689655, + "eval_ORGANIZATION_f1": 0.926517571884984, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9354838709677419, + "eval_ORGANIZATION_recall": 0.9177215189873418, + "eval_PERSON_f1": 0.9721115537848605, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9606299212598425, + "eval_PERSON_recall": 0.9838709677419355, + "eval_loss": 0.05284268409013748, + "eval_overall_accuracy": 0.9876475432335987, + "eval_overall_f1": 0.9425, + "eval_overall_precision": 0.9378109452736318, + "eval_overall_recall": 0.9472361809045227, + "eval_runtime": 0.2425, + "eval_samples_per_second": 701.026, + "eval_steps_per_second": 12.371, + "step": 7008 + }, + { + "epoch": 74.0, + "grad_norm": 0.1629040539264679, + "learning_rate": 1.3000000000000001e-05, + "loss": 0.0118, + "step": 7104 + }, + { + "epoch": 74.0, + "eval_LOCATION_f1": 0.9361702127659575, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9243697478991597, + "eval_LOCATION_recall": 0.9482758620689655, + "eval_ORGANIZATION_f1": 0.9329073482428115, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9419354838709677, + "eval_ORGANIZATION_recall": 0.9240506329113924, + "eval_PERSON_f1": 0.9721115537848605, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9606299212598425, + "eval_PERSON_recall": 0.9838709677419355, + "eval_loss": 0.05083697289228439, + "eval_overall_accuracy": 0.9884710403513588, + "eval_overall_f1": 0.9461827284105131, + "eval_overall_precision": 0.942643391521197, + "eval_overall_recall": 0.949748743718593, + "eval_runtime": 0.2416, + "eval_samples_per_second": 703.535, + "eval_steps_per_second": 12.415, + "step": 7104 + }, + { + "epoch": 75.0, + "grad_norm": 0.34347105026245117, + "learning_rate": 1.25e-05, + "loss": 0.0109, + "step": 7200 + }, + { + "epoch": 75.0, + "eval_LOCATION_f1": 0.9367088607594937, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9173553719008265, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.926517571884984, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9354838709677419, + "eval_ORGANIZATION_recall": 0.9177215189873418, + "eval_PERSON_f1": 0.9682539682539683, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.953125, + "eval_PERSON_recall": 0.9838709677419355, + "eval_loss": 0.053751371800899506, + "eval_overall_accuracy": 0.9881965413121054, + "eval_overall_f1": 0.9426433915211971, + "eval_overall_precision": 0.9356435643564357, + "eval_overall_recall": 0.949748743718593, + "eval_runtime": 0.2421, + "eval_samples_per_second": 702.067, + "eval_steps_per_second": 12.389, + "step": 7200 + }, + { + "epoch": 76.0, + "grad_norm": 0.0426780991256237, + "learning_rate": 1.2e-05, + "loss": 0.0115, + "step": 7296 + }, + { + "epoch": 76.0, + "eval_LOCATION_f1": 0.9367088607594937, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9173553719008265, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9294871794871796, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9415584415584416, + "eval_ORGANIZATION_recall": 0.9177215189873418, + "eval_PERSON_f1": 0.9682539682539683, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.953125, + "eval_PERSON_recall": 0.9838709677419355, + "eval_loss": 0.05429477617144585, + "eval_overall_accuracy": 0.9881965413121054, + "eval_overall_f1": 0.9438202247191011, + "eval_overall_precision": 0.9379652605459057, + "eval_overall_recall": 0.949748743718593, + "eval_runtime": 0.2446, + "eval_samples_per_second": 695.028, + "eval_steps_per_second": 12.265, + "step": 7296 + }, + { + "epoch": 77.0, + "grad_norm": 0.332469642162323, + "learning_rate": 1.1500000000000002e-05, + "loss": 0.0121, + "step": 7392 + }, + { + "epoch": 77.0, + "eval_LOCATION_f1": 0.9367088607594937, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9173553719008265, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9201277955271565, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9290322580645162, + "eval_ORGANIZATION_recall": 0.9113924050632911, + "eval_PERSON_f1": 0.9721115537848605, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9606299212598425, + "eval_PERSON_recall": 0.9838709677419355, + "eval_loss": 0.05492376908659935, + "eval_overall_accuracy": 0.9873730441943454, + "eval_overall_f1": 0.9413233458177278, + "eval_overall_precision": 0.9354838709677419, + "eval_overall_recall": 0.9472361809045227, + "eval_runtime": 0.242, + "eval_samples_per_second": 702.433, + "eval_steps_per_second": 12.396, + "step": 7392 + }, + { + "epoch": 78.0, + "grad_norm": 0.5249147415161133, + "learning_rate": 1.1000000000000001e-05, + "loss": 0.0116, + "step": 7488 + }, + { + "epoch": 78.0, + "eval_LOCATION_f1": 0.9367088607594937, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9173553719008265, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9044585987261147, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9102564102564102, + "eval_ORGANIZATION_recall": 0.8987341772151899, + "eval_PERSON_f1": 0.9721115537848605, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9606299212598425, + "eval_PERSON_recall": 0.9838709677419355, + "eval_loss": 0.05314483493566513, + "eval_overall_accuracy": 0.9862750480373319, + "eval_overall_f1": 0.9351620947630923, + "eval_overall_precision": 0.9282178217821783, + "eval_overall_recall": 0.9422110552763819, + "eval_runtime": 0.2432, + "eval_samples_per_second": 698.87, + "eval_steps_per_second": 12.333, + "step": 7488 + }, + { + "epoch": 79.0, + "grad_norm": 0.028825916349887848, + "learning_rate": 1.05e-05, + "loss": 0.0131, + "step": 7584 + }, + { + "epoch": 79.0, + "eval_LOCATION_f1": 0.944206008583691, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9401709401709402, + "eval_LOCATION_recall": 0.9482758620689655, + "eval_ORGANIZATION_f1": 0.9526813880126183, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.949685534591195, + "eval_ORGANIZATION_recall": 0.9556962025316456, + "eval_PERSON_f1": 0.9800796812749005, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.968503937007874, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.04911971837282181, + "eval_overall_accuracy": 0.9890200384298655, + "eval_overall_f1": 0.958801498127341, + "eval_overall_precision": 0.9528535980148883, + "eval_overall_recall": 0.964824120603015, + "eval_runtime": 0.2435, + "eval_samples_per_second": 698.29, + "eval_steps_per_second": 12.323, + "step": 7584 + }, + { + "epoch": 80.0, + "grad_norm": 0.19487972557544708, + "learning_rate": 1e-05, + "loss": 0.0113, + "step": 7680 + }, + { + "epoch": 80.0, + "eval_LOCATION_f1": 0.9482758620689655, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9482758620689655, + "eval_LOCATION_recall": 0.9482758620689655, + "eval_ORGANIZATION_f1": 0.9085173501577287, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9056603773584906, + "eval_ORGANIZATION_recall": 0.9113924050632911, + "eval_PERSON_f1": 0.9761904761904763, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9609375, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.05024532973766327, + "eval_overall_accuracy": 0.9873730441943454, + "eval_overall_f1": 0.9413233458177278, + "eval_overall_precision": 0.9354838709677419, + "eval_overall_recall": 0.9472361809045227, + "eval_runtime": 0.2425, + "eval_samples_per_second": 701.107, + "eval_steps_per_second": 12.372, + "step": 7680 + }, + { + "epoch": 81.0, + "grad_norm": 0.2933664619922638, + "learning_rate": 9.5e-06, + "loss": 0.0114, + "step": 7776 + }, + { + "epoch": 81.0, + "eval_LOCATION_f1": 0.9487179487179486, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.940677966101695, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9142857142857144, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9171974522292994, + "eval_ORGANIZATION_recall": 0.9113924050632911, + "eval_PERSON_f1": 0.9800796812749005, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.968503937007874, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.050492897629737854, + "eval_overall_accuracy": 0.9881965413121054, + "eval_overall_f1": 0.9450000000000001, + "eval_overall_precision": 0.9402985074626866, + "eval_overall_recall": 0.949748743718593, + "eval_runtime": 0.245, + "eval_samples_per_second": 693.863, + "eval_steps_per_second": 12.245, + "step": 7776 + }, + { + "epoch": 82.0, + "grad_norm": 0.8371833562850952, + "learning_rate": 9e-06, + "loss": 0.0101, + "step": 7872 + }, + { + "epoch": 82.0, + "eval_LOCATION_f1": 0.9446808510638298, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9327731092436975, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9137380191693291, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9225806451612903, + "eval_ORGANIZATION_recall": 0.9050632911392406, + "eval_PERSON_f1": 0.9761904761904763, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9609375, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.05484500154852867, + "eval_overall_accuracy": 0.987098545155092, + "eval_overall_f1": 0.9425, + "eval_overall_precision": 0.9378109452736318, + "eval_overall_recall": 0.9472361809045227, + "eval_runtime": 0.2414, + "eval_samples_per_second": 704.348, + "eval_steps_per_second": 12.43, + "step": 7872 + }, + { + "epoch": 83.0, + "grad_norm": 0.3084019720554352, + "learning_rate": 8.500000000000002e-06, + "loss": 0.0098, + "step": 7968 + }, + { + "epoch": 83.0, + "eval_LOCATION_f1": 0.9406779661016949, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.925, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.910828025477707, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9166666666666666, + "eval_ORGANIZATION_recall": 0.9050632911392406, + "eval_PERSON_f1": 0.9721115537848605, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9606299212598425, + "eval_PERSON_recall": 0.9838709677419355, + "eval_loss": 0.0543341189622879, + "eval_overall_accuracy": 0.987098545155092, + "eval_overall_f1": 0.9388264669163546, + "eval_overall_precision": 0.9330024813895782, + "eval_overall_recall": 0.9447236180904522, + "eval_runtime": 0.2426, + "eval_samples_per_second": 700.604, + "eval_steps_per_second": 12.364, + "step": 7968 + }, + { + "epoch": 84.0, + "grad_norm": 0.04305460304021835, + "learning_rate": 8.000000000000001e-06, + "loss": 0.01, + "step": 8064 + }, + { + "epoch": 84.0, + "eval_LOCATION_f1": 0.9527896995708154, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9487179487179487, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9299363057324842, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9358974358974359, + "eval_ORGANIZATION_recall": 0.9240506329113924, + "eval_PERSON_f1": 0.9800796812749005, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.968503937007874, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.054905395954847336, + "eval_overall_accuracy": 0.9873730441943454, + "eval_overall_f1": 0.9523809523809523, + "eval_overall_precision": 0.95, + "eval_overall_recall": 0.9547738693467337, + "eval_runtime": 0.2424, + "eval_samples_per_second": 701.305, + "eval_steps_per_second": 12.376, + "step": 8064 + }, + { + "epoch": 85.0, + "grad_norm": 0.7204985022544861, + "learning_rate": 7.5e-06, + "loss": 0.0106, + "step": 8160 + }, + { + "epoch": 85.0, + "eval_LOCATION_f1": 0.9491525423728815, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9333333333333333, + "eval_LOCATION_recall": 0.9655172413793104, + "eval_ORGANIZATION_f1": 0.926984126984127, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9299363057324841, + "eval_ORGANIZATION_recall": 0.9240506329113924, + "eval_PERSON_f1": 0.9800796812749005, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.968503937007874, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.05248566344380379, + "eval_overall_accuracy": 0.9890200384298655, + "eval_overall_f1": 0.9501246882793017, + "eval_overall_precision": 0.943069306930693, + "eval_overall_recall": 0.957286432160804, + "eval_runtime": 0.2418, + "eval_samples_per_second": 703.138, + "eval_steps_per_second": 12.408, + "step": 8160 + }, + { + "epoch": 86.0, + "grad_norm": 0.07470478117465973, + "learning_rate": 7.000000000000001e-06, + "loss": 0.0102, + "step": 8256 + }, + { + "epoch": 86.0, + "eval_LOCATION_f1": 0.9487179487179486, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.940677966101695, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.926984126984127, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9299363057324841, + "eval_ORGANIZATION_recall": 0.9240506329113924, + "eval_PERSON_f1": 0.976, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9682539682539683, + "eval_PERSON_recall": 0.9838709677419355, + "eval_loss": 0.05321876332163811, + "eval_overall_accuracy": 0.9879220422728521, + "eval_overall_f1": 0.9486858573216519, + "eval_overall_precision": 0.9451371571072319, + "eval_overall_recall": 0.9522613065326633, + "eval_runtime": 0.2428, + "eval_samples_per_second": 700.282, + "eval_steps_per_second": 12.358, + "step": 8256 + }, + { + "epoch": 87.0, + "grad_norm": 0.2286868691444397, + "learning_rate": 6.5000000000000004e-06, + "loss": 0.0092, + "step": 8352 + }, + { + "epoch": 87.0, + "eval_LOCATION_f1": 0.9367088607594937, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9173553719008265, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9206349206349206, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9235668789808917, + "eval_ORGANIZATION_recall": 0.9177215189873418, + "eval_PERSON_f1": 0.976, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9682539682539683, + "eval_PERSON_recall": 0.9838709677419355, + "eval_loss": 0.053863525390625, + "eval_overall_accuracy": 0.9879220422728521, + "eval_overall_f1": 0.9426433915211971, + "eval_overall_precision": 0.9356435643564357, + "eval_overall_recall": 0.949748743718593, + "eval_runtime": 0.2431, + "eval_samples_per_second": 699.324, + "eval_steps_per_second": 12.341, + "step": 8352 + }, + { + "epoch": 88.0, + "grad_norm": 0.19395892322063446, + "learning_rate": 6e-06, + "loss": 0.0095, + "step": 8448 + }, + { + "epoch": 88.0, + "eval_LOCATION_f1": 0.9367088607594937, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9173553719008265, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9299363057324842, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9358974358974359, + "eval_ORGANIZATION_recall": 0.9240506329113924, + "eval_PERSON_f1": 0.976, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9682539682539683, + "eval_PERSON_recall": 0.9838709677419355, + "eval_loss": 0.05385447293519974, + "eval_overall_accuracy": 0.9873730441943454, + "eval_overall_f1": 0.9463171036204745, + "eval_overall_precision": 0.9404466501240695, + "eval_overall_recall": 0.9522613065326633, + "eval_runtime": 0.2425, + "eval_samples_per_second": 700.995, + "eval_steps_per_second": 12.37, + "step": 8448 + }, + { + "epoch": 89.0, + "grad_norm": 0.5978826880455017, + "learning_rate": 5.500000000000001e-06, + "loss": 0.0099, + "step": 8544 + }, + { + "epoch": 89.0, + "eval_LOCATION_f1": 0.9406779661016949, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.925, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9367088607594937, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9367088607594937, + "eval_ORGANIZATION_recall": 0.9367088607594937, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.052636079490184784, + "eval_overall_accuracy": 0.9890200384298655, + "eval_overall_f1": 0.9526184538653367, + "eval_overall_precision": 0.9455445544554455, + "eval_overall_recall": 0.9597989949748744, + "eval_runtime": 0.2422, + "eval_samples_per_second": 702.032, + "eval_steps_per_second": 12.389, + "step": 8544 + }, + { + "epoch": 90.0, + "grad_norm": 0.17808915674686432, + "learning_rate": 5e-06, + "loss": 0.0095, + "step": 8640 + }, + { + "epoch": 90.0, + "eval_LOCATION_f1": 0.9487179487179486, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.940677966101695, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9363057324840764, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9423076923076923, + "eval_ORGANIZATION_recall": 0.930379746835443, + "eval_PERSON_f1": 0.9800796812749005, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.968503937007874, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.05316346138715744, + "eval_overall_accuracy": 0.9884710403513588, + "eval_overall_f1": 0.9536921151439299, + "eval_overall_precision": 0.9501246882793017, + "eval_overall_recall": 0.957286432160804, + "eval_runtime": 0.2434, + "eval_samples_per_second": 698.582, + "eval_steps_per_second": 12.328, + "step": 8640 + }, + { + "epoch": 91.0, + "grad_norm": 0.17433640360832214, + "learning_rate": 4.5e-06, + "loss": 0.0099, + "step": 8736 + }, + { + "epoch": 91.0, + "eval_LOCATION_f1": 0.9406779661016949, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.925, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9299363057324842, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9358974358974359, + "eval_ORGANIZATION_recall": 0.9240506329113924, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.052069030702114105, + "eval_overall_accuracy": 0.9887455393906122, + "eval_overall_f1": 0.95, + "eval_overall_precision": 0.945273631840796, + "eval_overall_recall": 0.9547738693467337, + "eval_runtime": 0.2421, + "eval_samples_per_second": 702.241, + "eval_steps_per_second": 12.392, + "step": 8736 + }, + { + "epoch": 92.0, + "grad_norm": 0.0391317717730999, + "learning_rate": 4.000000000000001e-06, + "loss": 0.0095, + "step": 8832 + }, + { + "epoch": 92.0, + "eval_LOCATION_f1": 0.9406779661016949, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.925, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9240506329113924, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9240506329113924, + "eval_ORGANIZATION_recall": 0.9240506329113924, + "eval_PERSON_f1": 0.976, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9682539682539683, + "eval_PERSON_recall": 0.9838709677419355, + "eval_loss": 0.05470087379217148, + "eval_overall_accuracy": 0.9879220422728521, + "eval_overall_f1": 0.9451371571072318, + "eval_overall_precision": 0.9381188118811881, + "eval_overall_recall": 0.9522613065326633, + "eval_runtime": 0.2418, + "eval_samples_per_second": 702.995, + "eval_steps_per_second": 12.406, + "step": 8832 + }, + { + "epoch": 93.0, + "grad_norm": 1.2939667701721191, + "learning_rate": 3.5000000000000004e-06, + "loss": 0.0096, + "step": 8928 + }, + { + "epoch": 93.0, + "eval_LOCATION_f1": 0.9487179487179486, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.940677966101695, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9299363057324842, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9358974358974359, + "eval_ORGANIZATION_recall": 0.9240506329113924, + "eval_PERSON_f1": 0.9721115537848605, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9606299212598425, + "eval_PERSON_recall": 0.9838709677419355, + "eval_loss": 0.05360059067606926, + "eval_overall_accuracy": 0.9884710403513588, + "eval_overall_f1": 0.9486858573216519, + "eval_overall_precision": 0.9451371571072319, + "eval_overall_recall": 0.9522613065326633, + "eval_runtime": 0.2419, + "eval_samples_per_second": 702.744, + "eval_steps_per_second": 12.401, + "step": 8928 + }, + { + "epoch": 94.0, + "grad_norm": 1.3997987508773804, + "learning_rate": 3e-06, + "loss": 0.009, + "step": 9024 + }, + { + "epoch": 94.0, + "eval_LOCATION_f1": 0.9446808510638298, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.9327731092436975, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9235668789808917, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9294871794871795, + "eval_ORGANIZATION_recall": 0.9177215189873418, + "eval_PERSON_f1": 0.9800796812749005, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.968503937007874, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.053766991943120956, + "eval_overall_accuracy": 0.9884710403513588, + "eval_overall_f1": 0.9475, + "eval_overall_precision": 0.9427860696517413, + "eval_overall_recall": 0.9522613065326633, + "eval_runtime": 0.2419, + "eval_samples_per_second": 702.867, + "eval_steps_per_second": 12.404, + "step": 9024 + }, + { + "epoch": 95.0, + "grad_norm": 0.015623769722878933, + "learning_rate": 2.5e-06, + "loss": 0.0094, + "step": 9120 + }, + { + "epoch": 95.0, + "eval_LOCATION_f1": 0.9406779661016949, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.925, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.926517571884984, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9354838709677419, + "eval_ORGANIZATION_recall": 0.9177215189873418, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.05312187969684601, + "eval_overall_accuracy": 0.9887455393906122, + "eval_overall_f1": 0.9486858573216519, + "eval_overall_precision": 0.9451371571072319, + "eval_overall_recall": 0.9522613065326633, + "eval_runtime": 0.2423, + "eval_samples_per_second": 701.669, + "eval_steps_per_second": 12.382, + "step": 9120 + }, + { + "epoch": 96.0, + "grad_norm": 0.06812173873186111, + "learning_rate": 2.0000000000000003e-06, + "loss": 0.0083, + "step": 9216 + }, + { + "epoch": 96.0, + "eval_LOCATION_f1": 0.9406779661016949, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.925, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.9235668789808917, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9294871794871795, + "eval_ORGANIZATION_recall": 0.9177215189873418, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.052705731242895126, + "eval_overall_accuracy": 0.9887455393906122, + "eval_overall_f1": 0.9475, + "eval_overall_precision": 0.9427860696517413, + "eval_overall_recall": 0.9522613065326633, + "eval_runtime": 0.2425, + "eval_samples_per_second": 701.06, + "eval_steps_per_second": 12.372, + "step": 9216 + }, + { + "epoch": 97.0, + "grad_norm": 0.13947905600070953, + "learning_rate": 1.5e-06, + "loss": 0.0099, + "step": 9312 + }, + { + "epoch": 97.0, + "eval_LOCATION_f1": 0.9406779661016949, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.925, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.926517571884984, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9354838709677419, + "eval_ORGANIZATION_recall": 0.9177215189873418, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.05367732793092728, + "eval_overall_accuracy": 0.9890200384298655, + "eval_overall_f1": 0.9486858573216519, + "eval_overall_precision": 0.9451371571072319, + "eval_overall_recall": 0.9522613065326633, + "eval_runtime": 0.2429, + "eval_samples_per_second": 699.966, + "eval_steps_per_second": 12.352, + "step": 9312 + }, + { + "epoch": 98.0, + "grad_norm": 0.10114230960607529, + "learning_rate": 1.0000000000000002e-06, + "loss": 0.0078, + "step": 9408 + }, + { + "epoch": 98.0, + "eval_LOCATION_f1": 0.9406779661016949, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.925, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.926517571884984, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9354838709677419, + "eval_ORGANIZATION_recall": 0.9177215189873418, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.05298721790313721, + "eval_overall_accuracy": 0.9892945374691189, + "eval_overall_f1": 0.9486858573216519, + "eval_overall_precision": 0.9451371571072319, + "eval_overall_recall": 0.9522613065326633, + "eval_runtime": 0.2421, + "eval_samples_per_second": 702.26, + "eval_steps_per_second": 12.393, + "step": 9408 + }, + { + "epoch": 99.0, + "grad_norm": 0.5689762234687805, + "learning_rate": 5.000000000000001e-07, + "loss": 0.0093, + "step": 9504 + }, + { + "epoch": 99.0, + "eval_LOCATION_f1": 0.9406779661016949, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.925, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.926517571884984, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9354838709677419, + "eval_ORGANIZATION_recall": 0.9177215189873418, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.052819643169641495, + "eval_overall_accuracy": 0.9892945374691189, + "eval_overall_f1": 0.9486858573216519, + "eval_overall_precision": 0.9451371571072319, + "eval_overall_recall": 0.9522613065326633, + "eval_runtime": 0.2426, + "eval_samples_per_second": 700.726, + "eval_steps_per_second": 12.366, + "step": 9504 + }, + { + "epoch": 100.0, + "grad_norm": 0.09888800233602524, + "learning_rate": 0.0, + "loss": 0.0086, + "step": 9600 + }, + { + "epoch": 100.0, + "eval_LOCATION_f1": 0.9406779661016949, + "eval_LOCATION_number": 116, + "eval_LOCATION_precision": 0.925, + "eval_LOCATION_recall": 0.9568965517241379, + "eval_ORGANIZATION_f1": 0.926517571884984, + "eval_ORGANIZATION_number": 158, + "eval_ORGANIZATION_precision": 0.9354838709677419, + "eval_ORGANIZATION_recall": 0.9177215189873418, + "eval_PERSON_f1": 0.9840000000000001, + "eval_PERSON_number": 124, + "eval_PERSON_precision": 0.9761904761904762, + "eval_PERSON_recall": 0.9919354838709677, + "eval_loss": 0.052767641842365265, + "eval_overall_accuracy": 0.9895690365083722, + "eval_overall_f1": 0.9486858573216519, + "eval_overall_precision": 0.9451371571072319, + "eval_overall_recall": 0.9522613065326633, + "eval_runtime": 0.2425, + "eval_samples_per_second": 701.096, + "eval_steps_per_second": 12.372, + "step": 9600 + }, + { + "epoch": 100.0, + "step": 9600, + "total_flos": 4293597283743744.0, + "train_loss": 0.04076442163437605, + "train_runtime": 503.1696, + "train_samples_per_second": 304.271, + "train_steps_per_second": 19.079 + } + ], + "logging_steps": 500, + "max_steps": 9600, + "num_input_tokens_seen": 0, + "num_train_epochs": 100, + "save_steps": 500, + "total_flos": 4293597283743744.0, + "train_batch_size": 16, + "trial_name": null, + "trial_params": null +}