{ "best_metric": 0.21482913196086884, "best_model_checkpoint": "/content/results/checkpoint-64059", "epoch": 15.0, "global_step": 320295, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.02, "learning_rate": 9.984389391030145e-06, "loss": 1.0634, "step": 500 }, { "epoch": 0.05, "learning_rate": 9.968778782060289e-06, "loss": 0.7186, "step": 1000 }, { "epoch": 0.07, "learning_rate": 9.953168173090433e-06, "loss": 0.6235, "step": 1500 }, { "epoch": 0.09, "learning_rate": 9.937557564120577e-06, "loss": 0.5584, "step": 2000 }, { "epoch": 0.12, "learning_rate": 9.921946955150721e-06, "loss": 0.5133, "step": 2500 }, { "epoch": 0.14, "learning_rate": 9.906336346180865e-06, "loss": 0.4825, "step": 3000 }, { "epoch": 0.16, "learning_rate": 9.890725737211009e-06, "loss": 0.4586, "step": 3500 }, { "epoch": 0.19, "learning_rate": 9.875115128241153e-06, "loss": 0.4298, "step": 4000 }, { "epoch": 0.21, "learning_rate": 9.859504519271297e-06, "loss": 0.4393, "step": 4500 }, { "epoch": 0.23, "learning_rate": 9.843893910301441e-06, "loss": 0.4019, "step": 5000 }, { "epoch": 0.26, "learning_rate": 9.828283301331585e-06, "loss": 0.3991, "step": 5500 }, { "epoch": 0.28, "learning_rate": 9.81267269236173e-06, "loss": 0.3994, "step": 6000 }, { "epoch": 0.3, "learning_rate": 9.797062083391873e-06, "loss": 0.3823, "step": 6500 }, { "epoch": 0.33, "learning_rate": 9.781451474422017e-06, "loss": 0.3674, "step": 7000 }, { "epoch": 0.35, "learning_rate": 9.765840865452161e-06, "loss": 0.3547, "step": 7500 }, { "epoch": 0.37, "learning_rate": 9.750230256482306e-06, "loss": 0.3762, "step": 8000 }, { "epoch": 0.4, "learning_rate": 9.73461964751245e-06, "loss": 0.3506, "step": 8500 }, { "epoch": 0.42, "learning_rate": 9.719009038542594e-06, "loss": 0.3532, "step": 9000 }, { "epoch": 0.44, "learning_rate": 9.703398429572738e-06, "loss": 0.3343, "step": 9500 }, { "epoch": 0.47, "learning_rate": 9.687787820602883e-06, "loss": 0.3463, "step": 10000 }, { "epoch": 0.49, "learning_rate": 9.672177211633027e-06, "loss": 0.333, "step": 10500 }, { "epoch": 0.52, "learning_rate": 9.656566602663172e-06, "loss": 0.3357, "step": 11000 }, { "epoch": 0.54, "learning_rate": 9.640955993693316e-06, "loss": 0.3295, "step": 11500 }, { "epoch": 0.56, "learning_rate": 9.62534538472346e-06, "loss": 0.3241, "step": 12000 }, { "epoch": 0.59, "learning_rate": 9.609734775753604e-06, "loss": 0.3194, "step": 12500 }, { "epoch": 0.61, "learning_rate": 9.594124166783748e-06, "loss": 0.3139, "step": 13000 }, { "epoch": 0.63, "learning_rate": 9.578513557813892e-06, "loss": 0.3162, "step": 13500 }, { "epoch": 0.66, "learning_rate": 9.562902948844036e-06, "loss": 0.301, "step": 14000 }, { "epoch": 0.68, "learning_rate": 9.54729233987418e-06, "loss": 0.3104, "step": 14500 }, { "epoch": 0.7, "learning_rate": 9.531681730904324e-06, "loss": 0.3152, "step": 15000 }, { "epoch": 0.73, "learning_rate": 9.516071121934466e-06, "loss": 0.2961, "step": 15500 }, { "epoch": 0.75, "learning_rate": 9.50046051296461e-06, "loss": 0.2985, "step": 16000 }, { "epoch": 0.77, "learning_rate": 9.484849903994756e-06, "loss": 0.2976, "step": 16500 }, { "epoch": 0.8, "learning_rate": 9.4692392950249e-06, "loss": 0.3076, "step": 17000 }, { "epoch": 0.82, "learning_rate": 9.453628686055044e-06, "loss": 0.2985, "step": 17500 }, { "epoch": 0.84, "learning_rate": 9.438018077085188e-06, "loss": 0.2954, "step": 18000 }, { "epoch": 0.87, "learning_rate": 9.422407468115332e-06, "loss": 0.2861, "step": 18500 }, { "epoch": 0.89, "learning_rate": 9.406796859145476e-06, "loss": 0.2777, "step": 19000 }, { "epoch": 0.91, "learning_rate": 9.39118625017562e-06, "loss": 0.2865, "step": 19500 }, { "epoch": 0.94, "learning_rate": 9.375575641205764e-06, "loss": 0.2864, "step": 20000 }, { "epoch": 0.96, "learning_rate": 9.359965032235908e-06, "loss": 0.2872, "step": 20500 }, { "epoch": 0.98, "learning_rate": 9.344354423266052e-06, "loss": 0.2881, "step": 21000 }, { "epoch": 1.0, "eval_AerospaceManufacturer_f1": 0.5919003115264798, "eval_AerospaceManufacturer_number": 138, "eval_AerospaceManufacturer_precision": 0.5191256830601093, "eval_AerospaceManufacturer_recall": 0.6884057971014492, "eval_AnatomicalStructure_f1": 0.6227544910179641, "eval_AnatomicalStructure_number": 227, "eval_AnatomicalStructure_precision": 0.5693430656934306, "eval_AnatomicalStructure_recall": 0.6872246696035242, "eval_ArtWork_f1": 0.45421245421245415, "eval_ArtWork_number": 131, "eval_ArtWork_precision": 0.43661971830985913, "eval_ArtWork_recall": 0.4732824427480916, "eval_Artist_f1": 0.755240947454397, "eval_Artist_number": 1722, "eval_Artist_precision": 0.7109174782162994, "eval_Artist_recall": 0.8054587688734031, "eval_Athlete_f1": 0.6791666666666666, "eval_Athlete_number": 719, "eval_Athlete_precision": 0.6782246879334258, "eval_Athlete_recall": 0.6801112656467315, "eval_CarManufacturer_f1": 0.6846846846846846, "eval_CarManufacturer_number": 159, "eval_CarManufacturer_precision": 0.6551724137931034, "eval_CarManufacturer_recall": 0.7169811320754716, "eval_Cleric_f1": 0.485, "eval_Cleric_number": 201, "eval_Cleric_precision": 0.48743718592964824, "eval_Cleric_recall": 0.48258706467661694, "eval_Clothing_f1": 0.5238095238095238, "eval_Clothing_number": 128, "eval_Clothing_precision": 0.463855421686747, "eval_Clothing_recall": 0.6015625, "eval_Disease_f1": 0.5766129032258064, "eval_Disease_number": 198, "eval_Disease_precision": 0.4798657718120805, "eval_Disease_recall": 0.7222222222222222, "eval_Drink_f1": 0.6130030959752323, "eval_Drink_number": 143, "eval_Drink_precision": 0.55, "eval_Drink_recall": 0.6923076923076923, "eval_Facility_f1": 0.5898123324396783, "eval_Facility_number": 497, "eval_Facility_precision": 0.5305466237942122, "eval_Facility_recall": 0.6639839034205232, "eval_Food_f1": 0.5176470588235295, "eval_Food_number": 214, "eval_Food_precision": 0.4041994750656168, "eval_Food_recall": 0.719626168224299, "eval_HumanSettlement_f1": 0.8466362599771949, "eval_HumanSettlement_number": 1689, "eval_HumanSettlement_precision": 0.8163826278174822, "eval_HumanSettlement_recall": 0.8792184724689165, "eval_MedicalProcedure_f1": 0.6302250803858521, "eval_MedicalProcedure_number": 142, "eval_MedicalProcedure_precision": 0.5798816568047337, "eval_MedicalProcedure_recall": 0.6901408450704225, "eval_Medication/Vaccine_f1": 0.6651982378854626, "eval_Medication/Vaccine_number": 200, "eval_Medication/Vaccine_precision": 0.594488188976378, "eval_Medication/Vaccine_recall": 0.755, "eval_MusicalGRP_f1": 0.6897546897546898, "eval_MusicalGRP_number": 372, "eval_MusicalGRP_precision": 0.7445482866043613, "eval_MusicalGRP_recall": 0.6424731182795699, "eval_MusicalWork_f1": 0.665024630541872, "eval_MusicalWork_number": 407, "eval_MusicalWork_precision": 0.6666666666666666, "eval_MusicalWork_recall": 0.6633906633906634, "eval_ORG_f1": 0.5618479880774963, "eval_ORG_number": 667, "eval_ORG_precision": 0.5585185185185185, "eval_ORG_recall": 0.5652173913043478, "eval_OtherLOC_f1": 0.5879396984924624, "eval_OtherLOC_number": 224, "eval_OtherLOC_precision": 0.6724137931034483, "eval_OtherLOC_recall": 0.5223214285714286, "eval_OtherPER_f1": 0.42531120331950206, "eval_OtherPER_number": 859, "eval_OtherPER_precision": 0.38353601496725914, "eval_OtherPER_recall": 0.47729918509895225, "eval_OtherPROD_f1": 0.48954489544895446, "eval_OtherPROD_number": 433, "eval_OtherPROD_precision": 0.5236842105263158, "eval_OtherPROD_recall": 0.45958429561200925, "eval_Politician_f1": 0.4895104895104895, "eval_Politician_number": 603, "eval_Politician_precision": 0.5175600739371534, "eval_Politician_recall": 0.46434494195688225, "eval_PrivateCorp_f1": 0.18633540372670807, "eval_PrivateCorp_number": 129, "eval_PrivateCorp_precision": 0.46875, "eval_PrivateCorp_recall": 0.11627906976744186, "eval_PublicCorp_f1": 0.49491525423728816, "eval_PublicCorp_number": 243, "eval_PublicCorp_precision": 0.4207492795389049, "eval_PublicCorp_recall": 0.6008230452674898, "eval_Scientist_f1": 0.3771428571428571, "eval_Scientist_number": 189, "eval_Scientist_precision": 0.40993788819875776, "eval_Scientist_recall": 0.3492063492063492, "eval_Software_f1": 0.7007751937984495, "eval_Software_number": 307, "eval_Software_precision": 0.6686390532544378, "eval_Software_recall": 0.7361563517915309, "eval_SportsGRP_f1": 0.7816091954022988, "eval_SportsGRP_number": 385, "eval_SportsGRP_precision": 0.7688442211055276, "eval_SportsGRP_recall": 0.7948051948051948, "eval_SportsManager_f1": 0.5458937198067633, "eval_SportsManager_number": 194, "eval_SportsManager_precision": 0.5136363636363637, "eval_SportsManager_recall": 0.5824742268041238, "eval_Station_f1": 0.7289719626168224, "eval_Station_number": 194, "eval_Station_precision": 0.6666666666666666, "eval_Station_recall": 0.8041237113402062, "eval_Symptom_f1": 0.2331288343558282, "eval_Symptom_number": 129, "eval_Symptom_precision": 0.5588235294117647, "eval_Symptom_recall": 0.14728682170542637, "eval_Vehicle_f1": 0.5093457943925234, "eval_Vehicle_number": 206, "eval_Vehicle_precision": 0.49099099099099097, "eval_Vehicle_recall": 0.529126213592233, "eval_VisualWork_f1": 0.7051630434782609, "eval_VisualWork_number": 693, "eval_VisualWork_precision": 0.6662387676508345, "eval_VisualWork_recall": 0.7489177489177489, "eval_WrittenWork_f1": 0.601640838650866, "eval_WrittenWork_number": 563, "eval_WrittenWork_precision": 0.6179775280898876, "eval_WrittenWork_recall": 0.5861456483126111, "eval_loss": 0.2534053325653076, "eval_overall_accuracy": 0.9220013874684423, "eval_overall_f1": 0.6377878853512382, "eval_overall_precision": 0.613600055567132, "eval_overall_recall": 0.6639609169485156, "eval_runtime": 45.6015, "eval_samples_per_second": 195.059, "eval_steps_per_second": 24.385, "step": 21353 }, { "epoch": 1.01, "learning_rate": 9.328743814296196e-06, "loss": 0.2759, "step": 21500 }, { "epoch": 1.03, "learning_rate": 9.31313320532634e-06, "loss": 0.2471, "step": 22000 }, { "epoch": 1.05, "learning_rate": 9.297522596356485e-06, "loss": 0.252, "step": 22500 }, { "epoch": 1.08, "learning_rate": 9.281911987386629e-06, "loss": 0.2423, "step": 23000 }, { "epoch": 1.1, "learning_rate": 9.266301378416773e-06, "loss": 0.2475, "step": 23500 }, { "epoch": 1.12, "learning_rate": 9.250690769446917e-06, "loss": 0.2464, "step": 24000 }, { "epoch": 1.15, "learning_rate": 9.23508016047706e-06, "loss": 0.2467, "step": 24500 }, { "epoch": 1.17, "learning_rate": 9.219469551507205e-06, "loss": 0.2535, "step": 25000 }, { "epoch": 1.19, "learning_rate": 9.203858942537349e-06, "loss": 0.248, "step": 25500 }, { "epoch": 1.22, "learning_rate": 9.188248333567493e-06, "loss": 0.2424, "step": 26000 }, { "epoch": 1.24, "learning_rate": 9.172637724597637e-06, "loss": 0.2362, "step": 26500 }, { "epoch": 1.26, "learning_rate": 9.157027115627781e-06, "loss": 0.2491, "step": 27000 }, { "epoch": 1.29, "learning_rate": 9.141416506657925e-06, "loss": 0.2411, "step": 27500 }, { "epoch": 1.31, "learning_rate": 9.125805897688069e-06, "loss": 0.2441, "step": 28000 }, { "epoch": 1.33, "learning_rate": 9.110195288718213e-06, "loss": 0.2449, "step": 28500 }, { "epoch": 1.36, "learning_rate": 9.094584679748357e-06, "loss": 0.2466, "step": 29000 }, { "epoch": 1.38, "learning_rate": 9.078974070778503e-06, "loss": 0.2388, "step": 29500 }, { "epoch": 1.4, "learning_rate": 9.063363461808647e-06, "loss": 0.2449, "step": 30000 }, { "epoch": 1.43, "learning_rate": 9.047752852838791e-06, "loss": 0.2475, "step": 30500 }, { "epoch": 1.45, "learning_rate": 9.032142243868935e-06, "loss": 0.2421, "step": 31000 }, { "epoch": 1.48, "learning_rate": 9.016531634899079e-06, "loss": 0.2416, "step": 31500 }, { "epoch": 1.5, "learning_rate": 9.000921025929223e-06, "loss": 0.2389, "step": 32000 }, { "epoch": 1.52, "learning_rate": 8.985310416959367e-06, "loss": 0.2353, "step": 32500 }, { "epoch": 1.55, "learning_rate": 8.96969980798951e-06, "loss": 0.2405, "step": 33000 }, { "epoch": 1.57, "learning_rate": 8.954089199019654e-06, "loss": 0.2348, "step": 33500 }, { "epoch": 1.59, "learning_rate": 8.938478590049798e-06, "loss": 0.2405, "step": 34000 }, { "epoch": 1.62, "learning_rate": 8.922867981079942e-06, "loss": 0.2234, "step": 34500 }, { "epoch": 1.64, "learning_rate": 8.907257372110086e-06, "loss": 0.2339, "step": 35000 }, { "epoch": 1.66, "learning_rate": 8.89164676314023e-06, "loss": 0.2307, "step": 35500 }, { "epoch": 1.69, "learning_rate": 8.876036154170375e-06, "loss": 0.2213, "step": 36000 }, { "epoch": 1.71, "learning_rate": 8.86042554520052e-06, "loss": 0.2251, "step": 36500 }, { "epoch": 1.73, "learning_rate": 8.844814936230664e-06, "loss": 0.2234, "step": 37000 }, { "epoch": 1.76, "learning_rate": 8.829204327260808e-06, "loss": 0.2324, "step": 37500 }, { "epoch": 1.78, "learning_rate": 8.813593718290952e-06, "loss": 0.2349, "step": 38000 }, { "epoch": 1.8, "learning_rate": 8.797983109321096e-06, "loss": 0.2264, "step": 38500 }, { "epoch": 1.83, "learning_rate": 8.78237250035124e-06, "loss": 0.2415, "step": 39000 }, { "epoch": 1.85, "learning_rate": 8.766761891381384e-06, "loss": 0.2315, "step": 39500 }, { "epoch": 1.87, "learning_rate": 8.751151282411528e-06, "loss": 0.2267, "step": 40000 }, { "epoch": 1.9, "learning_rate": 8.735540673441672e-06, "loss": 0.2186, "step": 40500 }, { "epoch": 1.92, "learning_rate": 8.719930064471816e-06, "loss": 0.2262, "step": 41000 }, { "epoch": 1.94, "learning_rate": 8.70431945550196e-06, "loss": 0.2288, "step": 41500 }, { "epoch": 1.97, "learning_rate": 8.688708846532104e-06, "loss": 0.2339, "step": 42000 }, { "epoch": 1.99, "learning_rate": 8.673098237562248e-06, "loss": 0.2195, "step": 42500 }, { "epoch": 2.0, "eval_AerospaceManufacturer_f1": 0.7272727272727273, "eval_AerospaceManufacturer_number": 138, "eval_AerospaceManufacturer_precision": 0.6408839779005525, "eval_AerospaceManufacturer_recall": 0.8405797101449275, "eval_AnatomicalStructure_f1": 0.6589861751152074, "eval_AnatomicalStructure_number": 227, "eval_AnatomicalStructure_precision": 0.6908212560386473, "eval_AnatomicalStructure_recall": 0.6299559471365639, "eval_ArtWork_f1": 0.555984555984556, "eval_ArtWork_number": 131, "eval_ArtWork_precision": 0.5625, "eval_ArtWork_recall": 0.549618320610687, "eval_Artist_f1": 0.7710112978782033, "eval_Artist_number": 1722, "eval_Artist_precision": 0.7336130047194547, "eval_Artist_recall": 0.8124274099883856, "eval_Athlete_f1": 0.7178217821782178, "eval_Athlete_number": 719, "eval_Athlete_precision": 0.6465997770345596, "eval_Athlete_recall": 0.8066759388038943, "eval_CarManufacturer_f1": 0.6937669376693767, "eval_CarManufacturer_number": 159, "eval_CarManufacturer_precision": 0.6095238095238096, "eval_CarManufacturer_recall": 0.8050314465408805, "eval_Cleric_f1": 0.5376344086021506, "eval_Cleric_number": 201, "eval_Cleric_precision": 0.5847953216374269, "eval_Cleric_recall": 0.4975124378109453, "eval_Clothing_f1": 0.574468085106383, "eval_Clothing_number": 128, "eval_Clothing_precision": 0.525974025974026, "eval_Clothing_recall": 0.6328125, "eval_Disease_f1": 0.587962962962963, "eval_Disease_number": 198, "eval_Disease_precision": 0.5427350427350427, "eval_Disease_recall": 0.6414141414141414, "eval_Drink_f1": 0.7017543859649124, "eval_Drink_number": 143, "eval_Drink_precision": 0.704225352112676, "eval_Drink_recall": 0.6993006993006993, "eval_Facility_f1": 0.6604477611940299, "eval_Facility_number": 497, "eval_Facility_precision": 0.6156521739130435, "eval_Facility_recall": 0.7122736418511066, "eval_Food_f1": 0.5454545454545454, "eval_Food_number": 214, "eval_Food_precision": 0.6140350877192983, "eval_Food_recall": 0.49065420560747663, "eval_HumanSettlement_f1": 0.8597206053550639, "eval_HumanSettlement_number": 1689, "eval_HumanSettlement_precision": 0.8454493417286777, "eval_HumanSettlement_recall": 0.8744819419775015, "eval_MedicalProcedure_f1": 0.6490066225165563, "eval_MedicalProcedure_number": 142, "eval_MedicalProcedure_precision": 0.6125, "eval_MedicalProcedure_recall": 0.6901408450704225, "eval_Medication/Vaccine_f1": 0.7163461538461539, "eval_Medication/Vaccine_number": 200, "eval_Medication/Vaccine_precision": 0.6898148148148148, "eval_Medication/Vaccine_recall": 0.745, "eval_MusicalGRP_f1": 0.7319034852546917, "eval_MusicalGRP_number": 372, "eval_MusicalGRP_precision": 0.7299465240641712, "eval_MusicalGRP_recall": 0.7338709677419355, "eval_MusicalWork_f1": 0.7058823529411764, "eval_MusicalWork_number": 407, "eval_MusicalWork_precision": 0.6901408450704225, "eval_MusicalWork_recall": 0.7223587223587223, "eval_ORG_f1": 0.6061538461538463, "eval_ORG_number": 667, "eval_ORG_precision": 0.6224328593996841, "eval_ORG_recall": 0.5907046476761619, "eval_OtherLOC_f1": 0.6634146341463415, "eval_OtherLOC_number": 224, "eval_OtherLOC_precision": 0.7311827956989247, "eval_OtherLOC_recall": 0.6071428571428571, "eval_OtherPER_f1": 0.48000000000000004, "eval_OtherPER_number": 859, "eval_OtherPER_precision": 0.48513674197384066, "eval_OtherPER_recall": 0.47497089639115253, "eval_OtherPROD_f1": 0.5333333333333333, "eval_OtherPROD_number": 433, "eval_OtherPROD_precision": 0.5994236311239193, "eval_OtherPROD_recall": 0.48036951501154734, "eval_Politician_f1": 0.5367132867132867, "eval_Politician_number": 603, "eval_Politician_precision": 0.5674676524953789, "eval_Politician_recall": 0.5091210613598673, "eval_PrivateCorp_f1": 0.5446009389671361, "eval_PrivateCorp_number": 129, "eval_PrivateCorp_precision": 0.6904761904761905, "eval_PrivateCorp_recall": 0.4496124031007752, "eval_PublicCorp_f1": 0.5916030534351144, "eval_PublicCorp_number": 243, "eval_PublicCorp_precision": 0.5516014234875445, "eval_PublicCorp_recall": 0.6378600823045267, "eval_Scientist_f1": 0.40588235294117647, "eval_Scientist_number": 189, "eval_Scientist_precision": 0.45695364238410596, "eval_Scientist_recall": 0.36507936507936506, "eval_Software_f1": 0.7483660130718954, "eval_Software_number": 307, "eval_Software_precision": 0.7508196721311475, "eval_Software_recall": 0.745928338762215, "eval_SportsGRP_f1": 0.8040455120101138, "eval_SportsGRP_number": 385, "eval_SportsGRP_precision": 0.7832512315270936, "eval_SportsGRP_recall": 0.825974025974026, "eval_SportsManager_f1": 0.5928143712574849, "eval_SportsManager_number": 194, "eval_SportsManager_precision": 0.7071428571428572, "eval_SportsManager_recall": 0.5103092783505154, "eval_Station_f1": 0.7416267942583731, "eval_Station_number": 194, "eval_Station_precision": 0.6919642857142857, "eval_Station_recall": 0.7989690721649485, "eval_Symptom_f1": 0.44621513944223107, "eval_Symptom_number": 129, "eval_Symptom_precision": 0.45901639344262296, "eval_Symptom_recall": 0.43410852713178294, "eval_Vehicle_f1": 0.5725190839694656, "eval_Vehicle_number": 206, "eval_Vehicle_precision": 0.4716981132075472, "eval_Vehicle_recall": 0.7281553398058253, "eval_VisualWork_f1": 0.7538247566063978, "eval_VisualWork_number": 693, "eval_VisualWork_precision": 0.72751677852349, "eval_VisualWork_recall": 0.7821067821067821, "eval_WrittenWork_f1": 0.6522522522522523, "eval_WrittenWork_number": 563, "eval_WrittenWork_precision": 0.6617915904936015, "eval_WrittenWork_recall": 0.6429840142095915, "eval_loss": 0.22884519398212433, "eval_overall_accuracy": 0.931677907068222, "eval_overall_f1": 0.6826710001477322, "eval_overall_precision": 0.6711204705540629, "eval_overall_recall": 0.6946260804208944, "eval_runtime": 43.7991, "eval_samples_per_second": 203.086, "eval_steps_per_second": 25.389, "step": 42706 }, { "epoch": 2.01, "learning_rate": 8.657487628592392e-06, "loss": 0.207, "step": 43000 }, { "epoch": 2.04, "learning_rate": 8.641877019622536e-06, "loss": 0.1895, "step": 43500 }, { "epoch": 2.06, "learning_rate": 8.62626641065268e-06, "loss": 0.1952, "step": 44000 }, { "epoch": 2.08, "learning_rate": 8.610655801682824e-06, "loss": 0.1875, "step": 44500 }, { "epoch": 2.11, "learning_rate": 8.595045192712968e-06, "loss": 0.1944, "step": 45000 }, { "epoch": 2.13, "learning_rate": 8.579434583743112e-06, "loss": 0.1868, "step": 45500 }, { "epoch": 2.15, "learning_rate": 8.563823974773256e-06, "loss": 0.1911, "step": 46000 }, { "epoch": 2.18, "learning_rate": 8.5482133658034e-06, "loss": 0.2001, "step": 46500 }, { "epoch": 2.2, "learning_rate": 8.532602756833544e-06, "loss": 0.1983, "step": 47000 }, { "epoch": 2.22, "learning_rate": 8.516992147863689e-06, "loss": 0.1855, "step": 47500 }, { "epoch": 2.25, "learning_rate": 8.501381538893833e-06, "loss": 0.1943, "step": 48000 }, { "epoch": 2.27, "learning_rate": 8.485770929923977e-06, "loss": 0.1876, "step": 48500 }, { "epoch": 2.29, "learning_rate": 8.470160320954122e-06, "loss": 0.1895, "step": 49000 }, { "epoch": 2.32, "learning_rate": 8.454549711984266e-06, "loss": 0.1938, "step": 49500 }, { "epoch": 2.34, "learning_rate": 8.43893910301441e-06, "loss": 0.1865, "step": 50000 }, { "epoch": 2.37, "learning_rate": 8.423328494044554e-06, "loss": 0.1941, "step": 50500 }, { "epoch": 2.39, "learning_rate": 8.407717885074697e-06, "loss": 0.1856, "step": 51000 }, { "epoch": 2.41, "learning_rate": 8.392107276104841e-06, "loss": 0.1938, "step": 51500 }, { "epoch": 2.44, "learning_rate": 8.376496667134985e-06, "loss": 0.1896, "step": 52000 }, { "epoch": 2.46, "learning_rate": 8.360886058165129e-06, "loss": 0.1873, "step": 52500 }, { "epoch": 2.48, "learning_rate": 8.345275449195273e-06, "loss": 0.1955, "step": 53000 }, { "epoch": 2.51, "learning_rate": 8.329664840225417e-06, "loss": 0.1875, "step": 53500 }, { "epoch": 2.53, "learning_rate": 8.314054231255561e-06, "loss": 0.1873, "step": 54000 }, { "epoch": 2.55, "learning_rate": 8.298443622285705e-06, "loss": 0.1977, "step": 54500 }, { "epoch": 2.58, "learning_rate": 8.28283301331585e-06, "loss": 0.1973, "step": 55000 }, { "epoch": 2.6, "learning_rate": 8.267222404345995e-06, "loss": 0.1853, "step": 55500 }, { "epoch": 2.62, "learning_rate": 8.251611795376139e-06, "loss": 0.1979, "step": 56000 }, { "epoch": 2.65, "learning_rate": 8.236001186406283e-06, "loss": 0.1881, "step": 56500 }, { "epoch": 2.67, "learning_rate": 8.220390577436427e-06, "loss": 0.1893, "step": 57000 }, { "epoch": 2.69, "learning_rate": 8.204779968466571e-06, "loss": 0.1936, "step": 57500 }, { "epoch": 2.72, "learning_rate": 8.189169359496715e-06, "loss": 0.1913, "step": 58000 }, { "epoch": 2.74, "learning_rate": 8.17355875052686e-06, "loss": 0.1861, "step": 58500 }, { "epoch": 2.76, "learning_rate": 8.157948141557003e-06, "loss": 0.1843, "step": 59000 }, { "epoch": 2.79, "learning_rate": 8.142337532587147e-06, "loss": 0.1874, "step": 59500 }, { "epoch": 2.81, "learning_rate": 8.126726923617291e-06, "loss": 0.1867, "step": 60000 }, { "epoch": 2.83, "learning_rate": 8.111116314647435e-06, "loss": 0.1863, "step": 60500 }, { "epoch": 2.86, "learning_rate": 8.09550570567758e-06, "loss": 0.1923, "step": 61000 }, { "epoch": 2.88, "learning_rate": 8.079895096707723e-06, "loss": 0.1961, "step": 61500 }, { "epoch": 2.9, "learning_rate": 8.064284487737868e-06, "loss": 0.181, "step": 62000 }, { "epoch": 2.93, "learning_rate": 8.048673878768012e-06, "loss": 0.1822, "step": 62500 }, { "epoch": 2.95, "learning_rate": 8.033063269798156e-06, "loss": 0.1842, "step": 63000 }, { "epoch": 2.97, "learning_rate": 8.0174526608283e-06, "loss": 0.1931, "step": 63500 }, { "epoch": 3.0, "learning_rate": 8.001842051858444e-06, "loss": 0.1965, "step": 64000 }, { "epoch": 3.0, "eval_AerospaceManufacturer_f1": 0.7682119205298014, "eval_AerospaceManufacturer_number": 138, "eval_AerospaceManufacturer_precision": 0.7073170731707317, "eval_AerospaceManufacturer_recall": 0.8405797101449275, "eval_AnatomicalStructure_f1": 0.7006369426751592, "eval_AnatomicalStructure_number": 227, "eval_AnatomicalStructure_precision": 0.6762295081967213, "eval_AnatomicalStructure_recall": 0.7268722466960352, "eval_ArtWork_f1": 0.5801526717557252, "eval_ArtWork_number": 131, "eval_ArtWork_precision": 0.5801526717557252, "eval_ArtWork_recall": 0.5801526717557252, "eval_Artist_f1": 0.7747237177670728, "eval_Artist_number": 1722, "eval_Artist_precision": 0.7565024903154399, "eval_Artist_recall": 0.7938443670150988, "eval_Athlete_f1": 0.7408906882591093, "eval_Athlete_number": 719, "eval_Athlete_precision": 0.7195281782437746, "eval_Athlete_recall": 0.7635605006954103, "eval_CarManufacturer_f1": 0.742857142857143, "eval_CarManufacturer_number": 159, "eval_CarManufacturer_precision": 0.680628272251309, "eval_CarManufacturer_recall": 0.8176100628930818, "eval_Cleric_f1": 0.5868945868945868, "eval_Cleric_number": 201, "eval_Cleric_precision": 0.6866666666666666, "eval_Cleric_recall": 0.5124378109452736, "eval_Clothing_f1": 0.6015037593984963, "eval_Clothing_number": 128, "eval_Clothing_precision": 0.5797101449275363, "eval_Clothing_recall": 0.625, "eval_Disease_f1": 0.6504854368932038, "eval_Disease_number": 198, "eval_Disease_precision": 0.6261682242990654, "eval_Disease_recall": 0.6767676767676768, "eval_Drink_f1": 0.7682119205298013, "eval_Drink_number": 143, "eval_Drink_precision": 0.7295597484276729, "eval_Drink_recall": 0.8111888111888111, "eval_Facility_f1": 0.6799620132953467, "eval_Facility_number": 497, "eval_Facility_precision": 0.6438848920863309, "eval_Facility_recall": 0.7203219315895373, "eval_Food_f1": 0.5968586387434555, "eval_Food_number": 214, "eval_Food_precision": 0.6785714285714286, "eval_Food_recall": 0.5327102803738317, "eval_HumanSettlement_f1": 0.8691834942932396, "eval_HumanSettlement_number": 1689, "eval_HumanSettlement_precision": 0.859375, "eval_HumanSettlement_recall": 0.8792184724689165, "eval_MedicalProcedure_f1": 0.7035830618892507, "eval_MedicalProcedure_number": 142, "eval_MedicalProcedure_precision": 0.6545454545454545, "eval_MedicalProcedure_recall": 0.7605633802816901, "eval_Medication/Vaccine_f1": 0.7409200968523003, "eval_Medication/Vaccine_number": 200, "eval_Medication/Vaccine_precision": 0.7183098591549296, "eval_Medication/Vaccine_recall": 0.765, "eval_MusicalGRP_f1": 0.7399741267787839, "eval_MusicalGRP_number": 372, "eval_MusicalGRP_precision": 0.713216957605985, "eval_MusicalGRP_recall": 0.7688172043010753, "eval_MusicalWork_f1": 0.7275031685678074, "eval_MusicalWork_number": 407, "eval_MusicalWork_precision": 0.7513089005235603, "eval_MusicalWork_recall": 0.7051597051597052, "eval_ORG_f1": 0.6224256292906178, "eval_ORG_number": 667, "eval_ORG_precision": 0.6335403726708074, "eval_ORG_recall": 0.6116941529235382, "eval_OtherLOC_f1": 0.6797066014669927, "eval_OtherLOC_number": 224, "eval_OtherLOC_precision": 0.7513513513513513, "eval_OtherLOC_recall": 0.6205357142857143, "eval_OtherPER_f1": 0.5112474437627812, "eval_OtherPER_number": 859, "eval_OtherPER_precision": 0.45578851412944393, "eval_OtherPER_recall": 0.5820721769499418, "eval_OtherPROD_f1": 0.5797101449275364, "eval_OtherPROD_number": 433, "eval_OtherPROD_precision": 0.6075949367088608, "eval_OtherPROD_recall": 0.5542725173210161, "eval_Politician_f1": 0.5417057169634489, "eval_Politician_number": 603, "eval_Politician_precision": 0.6228448275862069, "eval_Politician_recall": 0.4792703150912106, "eval_PrivateCorp_f1": 0.5806451612903226, "eval_PrivateCorp_number": 129, "eval_PrivateCorp_precision": 0.7159090909090909, "eval_PrivateCorp_recall": 0.4883720930232558, "eval_PublicCorp_f1": 0.6187845303867403, "eval_PublicCorp_number": 243, "eval_PublicCorp_precision": 0.56, "eval_PublicCorp_recall": 0.691358024691358, "eval_Scientist_f1": 0.45212765957446804, "eval_Scientist_number": 189, "eval_Scientist_precision": 0.45454545454545453, "eval_Scientist_recall": 0.4497354497354497, "eval_Software_f1": 0.7576687116564418, "eval_Software_number": 307, "eval_Software_precision": 0.7159420289855073, "eval_Software_recall": 0.8045602605863192, "eval_SportsGRP_f1": 0.8251231527093595, "eval_SportsGRP_number": 385, "eval_SportsGRP_precision": 0.7845433255269321, "eval_SportsGRP_recall": 0.8701298701298701, "eval_SportsManager_f1": 0.5942857142857142, "eval_SportsManager_number": 194, "eval_SportsManager_precision": 0.6666666666666666, "eval_SportsManager_recall": 0.5360824742268041, "eval_Station_f1": 0.7733990147783251, "eval_Station_number": 194, "eval_Station_precision": 0.7405660377358491, "eval_Station_recall": 0.8092783505154639, "eval_Symptom_f1": 0.5925925925925927, "eval_Symptom_number": 129, "eval_Symptom_precision": 0.631578947368421, "eval_Symptom_recall": 0.5581395348837209, "eval_Vehicle_f1": 0.5968819599109132, "eval_Vehicle_number": 206, "eval_Vehicle_precision": 0.551440329218107, "eval_Vehicle_recall": 0.6504854368932039, "eval_VisualWork_f1": 0.7738764044943821, "eval_VisualWork_number": 693, "eval_VisualWork_precision": 0.7537619699042407, "eval_VisualWork_recall": 0.7950937950937951, "eval_WrittenWork_f1": 0.6857654431512982, "eval_WrittenWork_number": 563, "eval_WrittenWork_precision": 0.6913357400722022, "eval_WrittenWork_recall": 0.6802841918294849, "eval_loss": 0.21482913196086884, "eval_overall_accuracy": 0.9355327807299229, "eval_overall_f1": 0.7033048369786461, "eval_overall_precision": 0.6927675707203266, "eval_overall_recall": 0.7141676061630966, "eval_runtime": 43.7848, "eval_samples_per_second": 203.153, "eval_steps_per_second": 25.397, "step": 64059 }, { "epoch": 3.02, "learning_rate": 7.986231442888588e-06, "loss": 0.159, "step": 64500 }, { "epoch": 3.04, "learning_rate": 7.970620833918732e-06, "loss": 0.157, "step": 65000 }, { "epoch": 3.07, "learning_rate": 7.955010224948876e-06, "loss": 0.1504, "step": 65500 }, { "epoch": 3.09, "learning_rate": 7.93939961597902e-06, "loss": 0.1578, "step": 66000 }, { "epoch": 3.11, "learning_rate": 7.923789007009164e-06, "loss": 0.1627, "step": 66500 }, { "epoch": 3.14, "learning_rate": 7.908178398039308e-06, "loss": 0.1606, "step": 67000 }, { "epoch": 3.16, "learning_rate": 7.892567789069452e-06, "loss": 0.1516, "step": 67500 }, { "epoch": 3.18, "learning_rate": 7.876957180099596e-06, "loss": 0.1601, "step": 68000 }, { "epoch": 3.21, "learning_rate": 7.86134657112974e-06, "loss": 0.1548, "step": 68500 }, { "epoch": 3.23, "learning_rate": 7.845735962159884e-06, "loss": 0.1661, "step": 69000 }, { "epoch": 3.25, "learning_rate": 7.830125353190028e-06, "loss": 0.1546, "step": 69500 }, { "epoch": 3.28, "learning_rate": 7.814514744220172e-06, "loss": 0.1553, "step": 70000 }, { "epoch": 3.3, "learning_rate": 7.798904135250316e-06, "loss": 0.1614, "step": 70500 }, { "epoch": 3.33, "learning_rate": 7.78329352628046e-06, "loss": 0.1601, "step": 71000 }, { "epoch": 3.35, "learning_rate": 7.767682917310604e-06, "loss": 0.1635, "step": 71500 }, { "epoch": 3.37, "learning_rate": 7.752072308340748e-06, "loss": 0.159, "step": 72000 }, { "epoch": 3.4, "learning_rate": 7.736461699370892e-06, "loss": 0.1655, "step": 72500 }, { "epoch": 3.42, "learning_rate": 7.720851090401037e-06, "loss": 0.1554, "step": 73000 }, { "epoch": 3.44, "learning_rate": 7.70524048143118e-06, "loss": 0.1558, "step": 73500 }, { "epoch": 3.47, "learning_rate": 7.689629872461325e-06, "loss": 0.1498, "step": 74000 }, { "epoch": 3.49, "learning_rate": 7.674019263491469e-06, "loss": 0.1565, "step": 74500 }, { "epoch": 3.51, "learning_rate": 7.658408654521613e-06, "loss": 0.1562, "step": 75000 }, { "epoch": 3.54, "learning_rate": 7.642798045551758e-06, "loss": 0.1639, "step": 75500 }, { "epoch": 3.56, "learning_rate": 7.6271874365819025e-06, "loss": 0.1625, "step": 76000 }, { "epoch": 3.58, "learning_rate": 7.611576827612046e-06, "loss": 0.156, "step": 76500 }, { "epoch": 3.61, "learning_rate": 7.59596621864219e-06, "loss": 0.1563, "step": 77000 }, { "epoch": 3.63, "learning_rate": 7.580355609672334e-06, "loss": 0.1563, "step": 77500 }, { "epoch": 3.65, "learning_rate": 7.564745000702478e-06, "loss": 0.151, "step": 78000 }, { "epoch": 3.68, "learning_rate": 7.549134391732622e-06, "loss": 0.1562, "step": 78500 }, { "epoch": 3.7, "learning_rate": 7.533523782762766e-06, "loss": 0.1593, "step": 79000 }, { "epoch": 3.72, "learning_rate": 7.51791317379291e-06, "loss": 0.1573, "step": 79500 }, { "epoch": 3.75, "learning_rate": 7.502302564823054e-06, "loss": 0.155, "step": 80000 }, { "epoch": 3.77, "learning_rate": 7.486691955853198e-06, "loss": 0.1579, "step": 80500 }, { "epoch": 3.79, "learning_rate": 7.471081346883342e-06, "loss": 0.1622, "step": 81000 }, { "epoch": 3.82, "learning_rate": 7.455470737913486e-06, "loss": 0.1571, "step": 81500 }, { "epoch": 3.84, "learning_rate": 7.439860128943631e-06, "loss": 0.1653, "step": 82000 }, { "epoch": 3.86, "learning_rate": 7.424249519973775e-06, "loss": 0.1675, "step": 82500 }, { "epoch": 3.89, "learning_rate": 7.408638911003919e-06, "loss": 0.1546, "step": 83000 }, { "epoch": 3.91, "learning_rate": 7.393028302034063e-06, "loss": 0.1572, "step": 83500 }, { "epoch": 3.93, "learning_rate": 7.377417693064207e-06, "loss": 0.1617, "step": 84000 }, { "epoch": 3.96, "learning_rate": 7.361807084094351e-06, "loss": 0.1637, "step": 84500 }, { "epoch": 3.98, "learning_rate": 7.346196475124495e-06, "loss": 0.1665, "step": 85000 }, { "epoch": 4.0, "eval_AerospaceManufacturer_f1": 0.8085106382978724, "eval_AerospaceManufacturer_number": 138, "eval_AerospaceManufacturer_precision": 0.7916666666666666, "eval_AerospaceManufacturer_recall": 0.8260869565217391, "eval_AnatomicalStructure_f1": 0.7145969498910675, "eval_AnatomicalStructure_number": 227, "eval_AnatomicalStructure_precision": 0.7068965517241379, "eval_AnatomicalStructure_recall": 0.7224669603524229, "eval_ArtWork_f1": 0.6263345195729537, "eval_ArtWork_number": 131, "eval_ArtWork_precision": 0.5866666666666667, "eval_ArtWork_recall": 0.6717557251908397, "eval_Artist_f1": 0.7822603719599428, "eval_Artist_number": 1722, "eval_Artist_precision": 0.7710095882684715, "eval_Artist_recall": 0.7938443670150988, "eval_Athlete_f1": 0.7289595758780649, "eval_Athlete_number": 719, "eval_Athlete_precision": 0.6962025316455697, "eval_Athlete_recall": 0.7649513212795549, "eval_CarManufacturer_f1": 0.8098159509202455, "eval_CarManufacturer_number": 159, "eval_CarManufacturer_precision": 0.7904191616766467, "eval_CarManufacturer_recall": 0.8301886792452831, "eval_Cleric_f1": 0.5737265415549598, "eval_Cleric_number": 201, "eval_Cleric_precision": 0.622093023255814, "eval_Cleric_recall": 0.5323383084577115, "eval_Clothing_f1": 0.6159420289855073, "eval_Clothing_number": 128, "eval_Clothing_precision": 0.5743243243243243, "eval_Clothing_recall": 0.6640625, "eval_Disease_f1": 0.6513761467889907, "eval_Disease_number": 198, "eval_Disease_precision": 0.5966386554621849, "eval_Disease_recall": 0.7171717171717171, "eval_Drink_f1": 0.7801418439716313, "eval_Drink_number": 143, "eval_Drink_precision": 0.7913669064748201, "eval_Drink_recall": 0.7692307692307693, "eval_Facility_f1": 0.6730219256434699, "eval_Facility_number": 497, "eval_Facility_precision": 0.6394927536231884, "eval_Facility_recall": 0.710261569416499, "eval_Food_f1": 0.6267942583732058, "eval_Food_number": 214, "eval_Food_precision": 0.6421568627450981, "eval_Food_recall": 0.6121495327102804, "eval_HumanSettlement_f1": 0.8683314415437003, "eval_HumanSettlement_number": 1689, "eval_HumanSettlement_precision": 0.8337874659400545, "eval_HumanSettlement_recall": 0.9058614564831261, "eval_MedicalProcedure_f1": 0.6938775510204082, "eval_MedicalProcedure_number": 142, "eval_MedicalProcedure_precision": 0.6710526315789473, "eval_MedicalProcedure_recall": 0.7183098591549296, "eval_Medication/Vaccine_f1": 0.7692307692307692, "eval_Medication/Vaccine_number": 200, "eval_Medication/Vaccine_precision": 0.7635467980295566, "eval_Medication/Vaccine_recall": 0.775, "eval_MusicalGRP_f1": 0.7638326585695007, "eval_MusicalGRP_number": 372, "eval_MusicalGRP_precision": 0.7669376693766937, "eval_MusicalGRP_recall": 0.760752688172043, "eval_MusicalWork_f1": 0.7366020524515393, "eval_MusicalWork_number": 407, "eval_MusicalWork_precision": 0.6872340425531915, "eval_MusicalWork_recall": 0.7936117936117936, "eval_ORG_f1": 0.6493083807973963, "eval_ORG_number": 667, "eval_ORG_precision": 0.7099644128113879, "eval_ORG_recall": 0.5982008995502249, "eval_OtherLOC_f1": 0.7228381374722838, "eval_OtherLOC_number": 224, "eval_OtherLOC_precision": 0.7180616740088106, "eval_OtherLOC_recall": 0.7276785714285714, "eval_OtherPER_f1": 0.5129032258064515, "eval_OtherPER_number": 859, "eval_OtherPER_precision": 0.47652347652347654, "eval_OtherPER_recall": 0.5552968568102444, "eval_OtherPROD_f1": 0.6040428061831153, "eval_OtherPROD_number": 433, "eval_OtherPROD_precision": 0.6225490196078431, "eval_OtherPROD_recall": 0.5866050808314087, "eval_Politician_f1": 0.5599284436493738, "eval_Politician_number": 603, "eval_Politician_precision": 0.6077669902912621, "eval_Politician_recall": 0.5190713101160862, "eval_PrivateCorp_f1": 0.593607305936073, "eval_PrivateCorp_number": 129, "eval_PrivateCorp_precision": 0.7222222222222222, "eval_PrivateCorp_recall": 0.5038759689922481, "eval_PublicCorp_f1": 0.6799276672694394, "eval_PublicCorp_number": 243, "eval_PublicCorp_precision": 0.6064516129032258, "eval_PublicCorp_recall": 0.7736625514403292, "eval_Scientist_f1": 0.5, "eval_Scientist_number": 189, "eval_Scientist_precision": 0.4782608695652174, "eval_Scientist_recall": 0.5238095238095238, "eval_Software_f1": 0.7632398753894081, "eval_Software_number": 307, "eval_Software_precision": 0.7313432835820896, "eval_Software_recall": 0.7980456026058632, "eval_SportsGRP_f1": 0.8498074454428755, "eval_SportsGRP_number": 385, "eval_SportsGRP_precision": 0.8401015228426396, "eval_SportsGRP_recall": 0.8597402597402597, "eval_SportsManager_f1": 0.6268656716417911, "eval_SportsManager_number": 194, "eval_SportsManager_precision": 0.6057692307692307, "eval_SportsManager_recall": 0.6494845360824743, "eval_Station_f1": 0.7719298245614034, "eval_Station_number": 194, "eval_Station_precision": 0.751219512195122, "eval_Station_recall": 0.7938144329896907, "eval_Symptom_f1": 0.6612244897959184, "eval_Symptom_number": 129, "eval_Symptom_precision": 0.6982758620689655, "eval_Symptom_recall": 0.627906976744186, "eval_Vehicle_f1": 0.6420824295010846, "eval_Vehicle_number": 206, "eval_Vehicle_precision": 0.5803921568627451, "eval_Vehicle_recall": 0.7184466019417476, "eval_VisualWork_f1": 0.7804195804195805, "eval_VisualWork_number": 693, "eval_VisualWork_precision": 0.757123473541384, "eval_VisualWork_recall": 0.8051948051948052, "eval_WrittenWork_f1": 0.6903914590747331, "eval_WrittenWork_number": 563, "eval_WrittenWork_precision": 0.6916221033868093, "eval_WrittenWork_recall": 0.6891651865008881, "eval_loss": 0.2192559540271759, "eval_overall_accuracy": 0.9374780973087403, "eval_overall_f1": 0.7157577095753294, "eval_overall_precision": 0.7012041243060062, "eval_overall_recall": 0.7309282224727546, "eval_runtime": 43.8304, "eval_samples_per_second": 202.942, "eval_steps_per_second": 25.371, "step": 85412 }, { "epoch": 4.0, "learning_rate": 7.330585866154639e-06, "loss": 0.1597, "step": 85500 }, { "epoch": 4.03, "learning_rate": 7.314975257184783e-06, "loss": 0.1339, "step": 86000 }, { "epoch": 4.05, "learning_rate": 7.2993646482149274e-06, "loss": 0.1355, "step": 86500 }, { "epoch": 4.07, "learning_rate": 7.2837540392450715e-06, "loss": 0.1332, "step": 87000 }, { "epoch": 4.1, "learning_rate": 7.2681434302752155e-06, "loss": 0.1334, "step": 87500 }, { "epoch": 4.12, "learning_rate": 7.2525328213053596e-06, "loss": 0.1373, "step": 88000 }, { "epoch": 4.14, "learning_rate": 7.2369222123355045e-06, "loss": 0.1289, "step": 88500 }, { "epoch": 4.17, "learning_rate": 7.2213116033656485e-06, "loss": 0.1298, "step": 89000 }, { "epoch": 4.19, "learning_rate": 7.2057009943957926e-06, "loss": 0.1382, "step": 89500 }, { "epoch": 4.21, "learning_rate": 7.190090385425937e-06, "loss": 0.1322, "step": 90000 }, { "epoch": 4.24, "learning_rate": 7.174479776456081e-06, "loss": 0.1283, "step": 90500 }, { "epoch": 4.26, "learning_rate": 7.158869167486225e-06, "loss": 0.1317, "step": 91000 }, { "epoch": 4.29, "learning_rate": 7.143258558516368e-06, "loss": 0.1347, "step": 91500 }, { "epoch": 4.31, "learning_rate": 7.127647949546512e-06, "loss": 0.1299, "step": 92000 }, { "epoch": 4.33, "learning_rate": 7.112037340576656e-06, "loss": 0.1325, "step": 92500 }, { "epoch": 4.36, "learning_rate": 7.0964267316068e-06, "loss": 0.131, "step": 93000 }, { "epoch": 4.38, "learning_rate": 7.080816122636944e-06, "loss": 0.1354, "step": 93500 }, { "epoch": 4.4, "learning_rate": 7.065205513667088e-06, "loss": 0.136, "step": 94000 }, { "epoch": 4.43, "learning_rate": 7.049594904697232e-06, "loss": 0.1373, "step": 94500 }, { "epoch": 4.45, "learning_rate": 7.033984295727377e-06, "loss": 0.1365, "step": 95000 }, { "epoch": 4.47, "learning_rate": 7.018373686757521e-06, "loss": 0.1327, "step": 95500 }, { "epoch": 4.5, "learning_rate": 7.002763077787665e-06, "loss": 0.1315, "step": 96000 }, { "epoch": 4.52, "learning_rate": 6.987152468817809e-06, "loss": 0.1297, "step": 96500 }, { "epoch": 4.54, "learning_rate": 6.971541859847953e-06, "loss": 0.1307, "step": 97000 }, { "epoch": 4.57, "learning_rate": 6.955931250878097e-06, "loss": 0.1374, "step": 97500 }, { "epoch": 4.59, "learning_rate": 6.940320641908241e-06, "loss": 0.1327, "step": 98000 }, { "epoch": 4.61, "learning_rate": 6.924710032938385e-06, "loss": 0.1367, "step": 98500 }, { "epoch": 4.64, "learning_rate": 6.909099423968529e-06, "loss": 0.1314, "step": 99000 }, { "epoch": 4.66, "learning_rate": 6.8934888149986735e-06, "loss": 0.1351, "step": 99500 }, { "epoch": 4.68, "learning_rate": 6.8778782060288175e-06, "loss": 0.1263, "step": 100000 }, { "epoch": 4.71, "learning_rate": 6.8622675970589616e-06, "loss": 0.1337, "step": 100500 }, { "epoch": 4.73, "learning_rate": 6.846656988089106e-06, "loss": 0.1332, "step": 101000 }, { "epoch": 4.75, "learning_rate": 6.8310463791192505e-06, "loss": 0.127, "step": 101500 }, { "epoch": 4.78, "learning_rate": 6.8154357701493945e-06, "loss": 0.1357, "step": 102000 }, { "epoch": 4.8, "learning_rate": 6.799825161179539e-06, "loss": 0.1382, "step": 102500 }, { "epoch": 4.82, "learning_rate": 6.784214552209683e-06, "loss": 0.1335, "step": 103000 }, { "epoch": 4.85, "learning_rate": 6.768603943239827e-06, "loss": 0.1273, "step": 103500 }, { "epoch": 4.87, "learning_rate": 6.752993334269971e-06, "loss": 0.1386, "step": 104000 }, { "epoch": 4.89, "learning_rate": 6.737382725300115e-06, "loss": 0.136, "step": 104500 }, { "epoch": 4.92, "learning_rate": 6.721772116330259e-06, "loss": 0.1369, "step": 105000 }, { "epoch": 4.94, "learning_rate": 6.706161507360403e-06, "loss": 0.1386, "step": 105500 }, { "epoch": 4.96, "learning_rate": 6.690550898390547e-06, "loss": 0.1397, "step": 106000 }, { "epoch": 4.99, "learning_rate": 6.67494028942069e-06, "loss": 0.1314, "step": 106500 }, { "epoch": 5.0, "eval_AerospaceManufacturer_f1": 0.8203389830508476, "eval_AerospaceManufacturer_number": 138, "eval_AerospaceManufacturer_precision": 0.7707006369426752, "eval_AerospaceManufacturer_recall": 0.8768115942028986, "eval_AnatomicalStructure_f1": 0.7350427350427351, "eval_AnatomicalStructure_number": 227, "eval_AnatomicalStructure_precision": 0.7136929460580913, "eval_AnatomicalStructure_recall": 0.7577092511013216, "eval_ArtWork_f1": 0.6194029850746268, "eval_ArtWork_number": 131, "eval_ArtWork_precision": 0.6058394160583942, "eval_ArtWork_recall": 0.6335877862595419, "eval_Artist_f1": 0.7818666666666667, "eval_Artist_number": 1722, "eval_Artist_precision": 0.722879684418146, "eval_Artist_recall": 0.851335656213705, "eval_Athlete_f1": 0.7555856465809072, "eval_Athlete_number": 719, "eval_Athlete_precision": 0.7361477572559367, "eval_Athlete_recall": 0.7760778859527121, "eval_CarManufacturer_f1": 0.7500000000000001, "eval_CarManufacturer_number": 159, "eval_CarManufacturer_precision": 0.6839378238341969, "eval_CarManufacturer_recall": 0.8301886792452831, "eval_Cleric_f1": 0.5931372549019609, "eval_Cleric_number": 201, "eval_Cleric_precision": 0.5845410628019324, "eval_Cleric_recall": 0.6019900497512438, "eval_Clothing_f1": 0.6311787072243347, "eval_Clothing_number": 128, "eval_Clothing_precision": 0.6148148148148148, "eval_Clothing_recall": 0.6484375, "eval_Disease_f1": 0.6604651162790697, "eval_Disease_number": 198, "eval_Disease_precision": 0.6120689655172413, "eval_Disease_recall": 0.7171717171717171, "eval_Drink_f1": 0.7467532467532467, "eval_Drink_number": 143, "eval_Drink_precision": 0.696969696969697, "eval_Drink_recall": 0.8041958041958042, "eval_Facility_f1": 0.6698841698841699, "eval_Facility_number": 497, "eval_Facility_precision": 0.6437847866419295, "eval_Facility_recall": 0.6981891348088531, "eval_Food_f1": 0.6473214285714286, "eval_Food_number": 214, "eval_Food_precision": 0.6196581196581197, "eval_Food_recall": 0.677570093457944, "eval_HumanSettlement_f1": 0.863139735480161, "eval_HumanSettlement_number": 1689, "eval_HumanSettlement_precision": 0.8390162101732812, "eval_HumanSettlement_recall": 0.8886915334517466, "eval_MedicalProcedure_f1": 0.7148014440433214, "eval_MedicalProcedure_number": 142, "eval_MedicalProcedure_precision": 0.7333333333333333, "eval_MedicalProcedure_recall": 0.6971830985915493, "eval_Medication/Vaccine_f1": 0.7780429594272076, "eval_Medication/Vaccine_number": 200, "eval_Medication/Vaccine_precision": 0.7442922374429224, "eval_Medication/Vaccine_recall": 0.815, "eval_MusicalGRP_f1": 0.7532133676092545, "eval_MusicalGRP_number": 372, "eval_MusicalGRP_precision": 0.7216748768472906, "eval_MusicalGRP_recall": 0.7876344086021505, "eval_MusicalWork_f1": 0.7333333333333333, "eval_MusicalWork_number": 407, "eval_MusicalWork_precision": 0.7113163972286374, "eval_MusicalWork_recall": 0.7567567567567568, "eval_ORG_f1": 0.6600910470409712, "eval_ORG_number": 667, "eval_ORG_precision": 0.6682027649769585, "eval_ORG_recall": 0.6521739130434783, "eval_OtherLOC_f1": 0.7072072072072073, "eval_OtherLOC_number": 224, "eval_OtherLOC_precision": 0.7136363636363636, "eval_OtherLOC_recall": 0.7008928571428571, "eval_OtherPER_f1": 0.5058317986494781, "eval_OtherPER_number": 859, "eval_OtherPER_precision": 0.535064935064935, "eval_OtherPER_recall": 0.479627473806752, "eval_OtherPROD_f1": 0.6089887640449437, "eval_OtherPROD_number": 433, "eval_OtherPROD_precision": 0.5929978118161926, "eval_OtherPROD_recall": 0.625866050808314, "eval_Politician_f1": 0.5642857142857143, "eval_Politician_number": 603, "eval_Politician_precision": 0.6112185686653772, "eval_Politician_recall": 0.5240464344941956, "eval_PrivateCorp_f1": 0.6896551724137931, "eval_PrivateCorp_number": 129, "eval_PrivateCorp_precision": 0.7766990291262136, "eval_PrivateCorp_recall": 0.6201550387596899, "eval_PublicCorp_f1": 0.6730038022813688, "eval_PublicCorp_number": 243, "eval_PublicCorp_precision": 0.6254416961130742, "eval_PublicCorp_recall": 0.7283950617283951, "eval_Scientist_f1": 0.48148148148148145, "eval_Scientist_number": 189, "eval_Scientist_precision": 0.48148148148148145, "eval_Scientist_recall": 0.48148148148148145, "eval_Software_f1": 0.7860538827258321, "eval_Software_number": 307, "eval_Software_precision": 0.7654320987654321, "eval_Software_recall": 0.8078175895765473, "eval_SportsGRP_f1": 0.8219832735961768, "eval_SportsGRP_number": 385, "eval_SportsGRP_precision": 0.7610619469026548, "eval_SportsGRP_recall": 0.8935064935064935, "eval_SportsManager_f1": 0.6361185983827493, "eval_SportsManager_number": 194, "eval_SportsManager_precision": 0.6666666666666666, "eval_SportsManager_recall": 0.6082474226804123, "eval_Station_f1": 0.7908163265306123, "eval_Station_number": 194, "eval_Station_precision": 0.7828282828282829, "eval_Station_recall": 0.7989690721649485, "eval_Symptom_f1": 0.6793893129770991, "eval_Symptom_number": 129, "eval_Symptom_precision": 0.6691729323308271, "eval_Symptom_recall": 0.689922480620155, "eval_Vehicle_f1": 0.6426966292134831, "eval_Vehicle_number": 206, "eval_Vehicle_precision": 0.5983263598326359, "eval_Vehicle_recall": 0.6941747572815534, "eval_VisualWork_f1": 0.7858136300417247, "eval_VisualWork_number": 693, "eval_VisualWork_precision": 0.7583892617449665, "eval_VisualWork_recall": 0.8152958152958153, "eval_WrittenWork_f1": 0.689236111111111, "eval_WrittenWork_number": 563, "eval_WrittenWork_precision": 0.6740237691001698, "eval_WrittenWork_recall": 0.7051509769094139, "eval_loss": 0.22715534269809723, "eval_overall_accuracy": 0.9377927808729608, "eval_overall_f1": 0.7198099415204678, "eval_overall_precision": 0.7006047669868374, "eval_overall_recall": 0.740097707628711, "eval_runtime": 43.8136, "eval_samples_per_second": 203.019, "eval_steps_per_second": 25.38, "step": 106765 }, { "epoch": 5.01, "learning_rate": 6.659329680450834e-06, "loss": 0.1261, "step": 107000 }, { "epoch": 5.03, "learning_rate": 6.643719071480978e-06, "loss": 0.1168, "step": 107500 }, { "epoch": 5.06, "learning_rate": 6.628108462511124e-06, "loss": 0.11, "step": 108000 }, { "epoch": 5.08, "learning_rate": 6.612497853541268e-06, "loss": 0.1045, "step": 108500 }, { "epoch": 5.1, "learning_rate": 6.596887244571412e-06, "loss": 0.1143, "step": 109000 }, { "epoch": 5.13, "learning_rate": 6.581276635601555e-06, "loss": 0.1086, "step": 109500 }, { "epoch": 5.15, "learning_rate": 6.565666026631699e-06, "loss": 0.1117, "step": 110000 }, { "epoch": 5.17, "learning_rate": 6.550055417661843e-06, "loss": 0.1104, "step": 110500 }, { "epoch": 5.2, "learning_rate": 6.534444808691987e-06, "loss": 0.1097, "step": 111000 }, { "epoch": 5.22, "learning_rate": 6.518834199722131e-06, "loss": 0.1148, "step": 111500 }, { "epoch": 5.25, "learning_rate": 6.5032235907522754e-06, "loss": 0.1141, "step": 112000 }, { "epoch": 5.27, "learning_rate": 6.4876129817824195e-06, "loss": 0.1071, "step": 112500 }, { "epoch": 5.29, "learning_rate": 6.4720023728125635e-06, "loss": 0.1111, "step": 113000 }, { "epoch": 5.32, "learning_rate": 6.456391763842708e-06, "loss": 0.1148, "step": 113500 }, { "epoch": 5.34, "learning_rate": 6.440781154872852e-06, "loss": 0.1208, "step": 114000 }, { "epoch": 5.36, "learning_rate": 6.4251705459029965e-06, "loss": 0.1176, "step": 114500 }, { "epoch": 5.39, "learning_rate": 6.4095599369331406e-06, "loss": 0.1178, "step": 115000 }, { "epoch": 5.41, "learning_rate": 6.393949327963285e-06, "loss": 0.1175, "step": 115500 }, { "epoch": 5.43, "learning_rate": 6.378338718993429e-06, "loss": 0.1123, "step": 116000 }, { "epoch": 5.46, "learning_rate": 6.362728110023573e-06, "loss": 0.1152, "step": 116500 }, { "epoch": 5.48, "learning_rate": 6.347117501053717e-06, "loss": 0.1237, "step": 117000 }, { "epoch": 5.5, "learning_rate": 6.331506892083861e-06, "loss": 0.1136, "step": 117500 }, { "epoch": 5.53, "learning_rate": 6.315896283114005e-06, "loss": 0.1113, "step": 118000 }, { "epoch": 5.55, "learning_rate": 6.300285674144149e-06, "loss": 0.1132, "step": 118500 }, { "epoch": 5.57, "learning_rate": 6.284675065174293e-06, "loss": 0.1136, "step": 119000 }, { "epoch": 5.6, "learning_rate": 6.269064456204437e-06, "loss": 0.116, "step": 119500 }, { "epoch": 5.62, "learning_rate": 6.253453847234581e-06, "loss": 0.1186, "step": 120000 }, { "epoch": 5.64, "learning_rate": 6.237843238264725e-06, "loss": 0.1122, "step": 120500 }, { "epoch": 5.67, "learning_rate": 6.22223262929487e-06, "loss": 0.1158, "step": 121000 }, { "epoch": 5.69, "learning_rate": 6.206622020325014e-06, "loss": 0.1151, "step": 121500 }, { "epoch": 5.71, "learning_rate": 6.191011411355158e-06, "loss": 0.1194, "step": 122000 }, { "epoch": 5.74, "learning_rate": 6.175400802385302e-06, "loss": 0.1117, "step": 122500 }, { "epoch": 5.76, "learning_rate": 6.159790193415446e-06, "loss": 0.1096, "step": 123000 }, { "epoch": 5.78, "learning_rate": 6.14417958444559e-06, "loss": 0.1177, "step": 123500 }, { "epoch": 5.81, "learning_rate": 6.128568975475734e-06, "loss": 0.1137, "step": 124000 }, { "epoch": 5.83, "learning_rate": 6.1129583665058774e-06, "loss": 0.1179, "step": 124500 }, { "epoch": 5.85, "learning_rate": 6.0973477575360215e-06, "loss": 0.1138, "step": 125000 }, { "epoch": 5.88, "learning_rate": 6.0817371485661655e-06, "loss": 0.1152, "step": 125500 }, { "epoch": 5.9, "learning_rate": 6.0661265395963096e-06, "loss": 0.1095, "step": 126000 }, { "epoch": 5.92, "learning_rate": 6.050515930626454e-06, "loss": 0.1141, "step": 126500 }, { "epoch": 5.95, "learning_rate": 6.034905321656598e-06, "loss": 0.1142, "step": 127000 }, { "epoch": 5.97, "learning_rate": 6.0192947126867425e-06, "loss": 0.111, "step": 127500 }, { "epoch": 5.99, "learning_rate": 6.003684103716887e-06, "loss": 0.1224, "step": 128000 }, { "epoch": 6.0, "eval_AerospaceManufacturer_f1": 0.8345323741007195, "eval_AerospaceManufacturer_number": 138, "eval_AerospaceManufacturer_precision": 0.8285714285714286, "eval_AerospaceManufacturer_recall": 0.8405797101449275, "eval_AnatomicalStructure_f1": 0.7161016949152542, "eval_AnatomicalStructure_number": 227, "eval_AnatomicalStructure_precision": 0.689795918367347, "eval_AnatomicalStructure_recall": 0.7444933920704846, "eval_ArtWork_f1": 0.657439446366782, "eval_ArtWork_number": 131, "eval_ArtWork_precision": 0.6012658227848101, "eval_ArtWork_recall": 0.7251908396946565, "eval_Artist_f1": 0.7972489683631361, "eval_Artist_number": 1722, "eval_Artist_precision": 0.7574490329325666, "eval_Artist_recall": 0.8414634146341463, "eval_Athlete_f1": 0.7441217150760719, "eval_Athlete_number": 719, "eval_Athlete_precision": 0.7400275103163686, "eval_Athlete_recall": 0.7482614742698191, "eval_CarManufacturer_f1": 0.8282208588957056, "eval_CarManufacturer_number": 159, "eval_CarManufacturer_precision": 0.8083832335329342, "eval_CarManufacturer_recall": 0.8490566037735849, "eval_Cleric_f1": 0.631868131868132, "eval_Cleric_number": 201, "eval_Cleric_precision": 0.7055214723926381, "eval_Cleric_recall": 0.572139303482587, "eval_Clothing_f1": 0.6153846153846154, "eval_Clothing_number": 128, "eval_Clothing_precision": 0.6060606060606061, "eval_Clothing_recall": 0.625, "eval_Disease_f1": 0.6925064599483205, "eval_Disease_number": 198, "eval_Disease_precision": 0.708994708994709, "eval_Disease_recall": 0.6767676767676768, "eval_Drink_f1": 0.7670250896057347, "eval_Drink_number": 143, "eval_Drink_precision": 0.7867647058823529, "eval_Drink_recall": 0.7482517482517482, "eval_Facility_f1": 0.6957328385899815, "eval_Facility_number": 497, "eval_Facility_precision": 0.6454388984509466, "eval_Facility_recall": 0.7545271629778671, "eval_Food_f1": 0.6607538802660754, "eval_Food_number": 214, "eval_Food_precision": 0.6286919831223629, "eval_Food_recall": 0.6962616822429907, "eval_HumanSettlement_f1": 0.8696916812100058, "eval_HumanSettlement_number": 1689, "eval_HumanSettlement_precision": 0.8547741566609491, "eval_HumanSettlement_recall": 0.8851391355831854, "eval_MedicalProcedure_f1": 0.7418181818181818, "eval_MedicalProcedure_number": 142, "eval_MedicalProcedure_precision": 0.7669172932330827, "eval_MedicalProcedure_recall": 0.7183098591549296, "eval_Medication/Vaccine_f1": 0.7857142857142856, "eval_Medication/Vaccine_number": 200, "eval_Medication/Vaccine_precision": 0.75, "eval_Medication/Vaccine_recall": 0.825, "eval_MusicalGRP_f1": 0.7661691542288557, "eval_MusicalGRP_number": 372, "eval_MusicalGRP_precision": 0.7129629629629629, "eval_MusicalGRP_recall": 0.8279569892473119, "eval_MusicalWork_f1": 0.7404063205417607, "eval_MusicalWork_number": 407, "eval_MusicalWork_precision": 0.6847599164926931, "eval_MusicalWork_recall": 0.8058968058968059, "eval_ORG_f1": 0.6771406127258445, "eval_ORG_number": 667, "eval_ORG_precision": 0.7112211221122112, "eval_ORG_recall": 0.6461769115442278, "eval_OtherLOC_f1": 0.7393364928909952, "eval_OtherLOC_number": 224, "eval_OtherLOC_precision": 0.7878787878787878, "eval_OtherLOC_recall": 0.6964285714285714, "eval_OtherPER_f1": 0.5378346915017462, "eval_OtherPER_number": 859, "eval_OtherPER_precision": 0.5378346915017462, "eval_OtherPER_recall": 0.5378346915017462, "eval_OtherPROD_f1": 0.6151960784313726, "eval_OtherPROD_number": 433, "eval_OtherPROD_precision": 0.6553524804177546, "eval_OtherPROD_recall": 0.5796766743648961, "eval_Politician_f1": 0.5916666666666666, "eval_Politician_number": 603, "eval_Politician_precision": 0.5946398659966499, "eval_Politician_recall": 0.5887230514096186, "eval_PrivateCorp_f1": 0.7372881355932203, "eval_PrivateCorp_number": 129, "eval_PrivateCorp_precision": 0.8130841121495327, "eval_PrivateCorp_recall": 0.6744186046511628, "eval_PublicCorp_f1": 0.7054409005628517, "eval_PublicCorp_number": 243, "eval_PublicCorp_precision": 0.6482758620689655, "eval_PublicCorp_recall": 0.7736625514403292, "eval_Scientist_f1": 0.53551912568306, "eval_Scientist_number": 189, "eval_Scientist_precision": 0.5536723163841808, "eval_Scientist_recall": 0.5185185185185185, "eval_Software_f1": 0.784, "eval_Software_number": 307, "eval_Software_precision": 0.7704402515723271, "eval_Software_recall": 0.7980456026058632, "eval_SportsGRP_f1": 0.8679245283018868, "eval_SportsGRP_number": 385, "eval_SportsGRP_precision": 0.8414634146341463, "eval_SportsGRP_recall": 0.8961038961038961, "eval_SportsManager_f1": 0.663265306122449, "eval_SportsManager_number": 194, "eval_SportsManager_precision": 0.6565656565656566, "eval_SportsManager_recall": 0.6701030927835051, "eval_Station_f1": 0.7959183673469388, "eval_Station_number": 194, "eval_Station_precision": 0.7878787878787878, "eval_Station_recall": 0.8041237113402062, "eval_Symptom_f1": 0.6894197952218429, "eval_Symptom_number": 129, "eval_Symptom_precision": 0.6158536585365854, "eval_Symptom_recall": 0.7829457364341085, "eval_Vehicle_f1": 0.643171806167401, "eval_Vehicle_number": 206, "eval_Vehicle_precision": 0.5887096774193549, "eval_Vehicle_recall": 0.7087378640776699, "eval_VisualWork_f1": 0.7942857142857144, "eval_VisualWork_number": 693, "eval_VisualWork_precision": 0.7864214992927864, "eval_VisualWork_recall": 0.8023088023088023, "eval_WrittenWork_f1": 0.7044609665427509, "eval_WrittenWork_number": 563, "eval_WrittenWork_precision": 0.7387914230019493, "eval_WrittenWork_recall": 0.6731793960923623, "eval_loss": 0.22752739489078522, "eval_overall_accuracy": 0.9406249329509451, "eval_overall_f1": 0.7345913807747703, "eval_overall_precision": 0.7220850878466676, "eval_overall_recall": 0.7475385193536265, "eval_runtime": 44.5182, "eval_samples_per_second": 199.806, "eval_steps_per_second": 24.979, "step": 128118 }, { "epoch": 6.02, "learning_rate": 5.988073494747031e-06, "loss": 0.0957, "step": 128500 }, { "epoch": 6.04, "learning_rate": 5.972462885777175e-06, "loss": 0.0884, "step": 129000 }, { "epoch": 6.06, "learning_rate": 5.956852276807319e-06, "loss": 0.0953, "step": 129500 }, { "epoch": 6.09, "learning_rate": 5.941241667837463e-06, "loss": 0.0941, "step": 130000 }, { "epoch": 6.11, "learning_rate": 5.925631058867607e-06, "loss": 0.0958, "step": 130500 }, { "epoch": 6.13, "learning_rate": 5.910020449897751e-06, "loss": 0.0963, "step": 131000 }, { "epoch": 6.16, "learning_rate": 5.894409840927895e-06, "loss": 0.0947, "step": 131500 }, { "epoch": 6.18, "learning_rate": 5.878799231958039e-06, "loss": 0.0963, "step": 132000 }, { "epoch": 6.21, "learning_rate": 5.863188622988183e-06, "loss": 0.0941, "step": 132500 }, { "epoch": 6.23, "learning_rate": 5.847578014018327e-06, "loss": 0.0948, "step": 133000 }, { "epoch": 6.25, "learning_rate": 5.831967405048471e-06, "loss": 0.0984, "step": 133500 }, { "epoch": 6.28, "learning_rate": 5.816356796078616e-06, "loss": 0.0987, "step": 134000 }, { "epoch": 6.3, "learning_rate": 5.80074618710876e-06, "loss": 0.1006, "step": 134500 }, { "epoch": 6.32, "learning_rate": 5.785135578138904e-06, "loss": 0.0955, "step": 135000 }, { "epoch": 6.35, "learning_rate": 5.769524969169048e-06, "loss": 0.0964, "step": 135500 }, { "epoch": 6.37, "learning_rate": 5.753914360199192e-06, "loss": 0.1005, "step": 136000 }, { "epoch": 6.39, "learning_rate": 5.738303751229336e-06, "loss": 0.0985, "step": 136500 }, { "epoch": 6.42, "learning_rate": 5.72269314225948e-06, "loss": 0.0969, "step": 137000 }, { "epoch": 6.44, "learning_rate": 5.707082533289624e-06, "loss": 0.0961, "step": 137500 }, { "epoch": 6.46, "learning_rate": 5.691471924319768e-06, "loss": 0.0986, "step": 138000 }, { "epoch": 6.49, "learning_rate": 5.675861315349912e-06, "loss": 0.0942, "step": 138500 }, { "epoch": 6.51, "learning_rate": 5.6602507063800564e-06, "loss": 0.1067, "step": 139000 }, { "epoch": 6.53, "learning_rate": 5.6446400974102e-06, "loss": 0.0984, "step": 139500 }, { "epoch": 6.56, "learning_rate": 5.629029488440344e-06, "loss": 0.099, "step": 140000 }, { "epoch": 6.58, "learning_rate": 5.613418879470489e-06, "loss": 0.0987, "step": 140500 }, { "epoch": 6.6, "learning_rate": 5.5978082705006335e-06, "loss": 0.092, "step": 141000 }, { "epoch": 6.63, "learning_rate": 5.5821976615307775e-06, "loss": 0.0973, "step": 141500 }, { "epoch": 6.65, "learning_rate": 5.5665870525609216e-06, "loss": 0.0989, "step": 142000 }, { "epoch": 6.67, "learning_rate": 5.550976443591065e-06, "loss": 0.0972, "step": 142500 }, { "epoch": 6.7, "learning_rate": 5.535365834621209e-06, "loss": 0.0961, "step": 143000 }, { "epoch": 6.72, "learning_rate": 5.519755225651353e-06, "loss": 0.0995, "step": 143500 }, { "epoch": 6.74, "learning_rate": 5.504144616681497e-06, "loss": 0.0931, "step": 144000 }, { "epoch": 6.77, "learning_rate": 5.488534007711641e-06, "loss": 0.1078, "step": 144500 }, { "epoch": 6.79, "learning_rate": 5.472923398741785e-06, "loss": 0.0958, "step": 145000 }, { "epoch": 6.81, "learning_rate": 5.457312789771929e-06, "loss": 0.0967, "step": 145500 }, { "epoch": 6.84, "learning_rate": 5.441702180802073e-06, "loss": 0.0976, "step": 146000 }, { "epoch": 6.86, "learning_rate": 5.426091571832217e-06, "loss": 0.0946, "step": 146500 }, { "epoch": 6.88, "learning_rate": 5.410480962862362e-06, "loss": 0.0981, "step": 147000 }, { "epoch": 6.91, "learning_rate": 5.394870353892506e-06, "loss": 0.0968, "step": 147500 }, { "epoch": 6.93, "learning_rate": 5.37925974492265e-06, "loss": 0.0965, "step": 148000 }, { "epoch": 6.95, "learning_rate": 5.363649135952794e-06, "loss": 0.0985, "step": 148500 }, { "epoch": 6.98, "learning_rate": 5.348038526982938e-06, "loss": 0.0964, "step": 149000 }, { "epoch": 7.0, "eval_AerospaceManufacturer_f1": 0.8304498269896193, "eval_AerospaceManufacturer_number": 138, "eval_AerospaceManufacturer_precision": 0.7947019867549668, "eval_AerospaceManufacturer_recall": 0.8695652173913043, "eval_AnatomicalStructure_f1": 0.7334754797441364, "eval_AnatomicalStructure_number": 227, "eval_AnatomicalStructure_precision": 0.7107438016528925, "eval_AnatomicalStructure_recall": 0.7577092511013216, "eval_ArtWork_f1": 0.6691449814126395, "eval_ArtWork_number": 131, "eval_ArtWork_precision": 0.6521739130434783, "eval_ArtWork_recall": 0.6870229007633588, "eval_Artist_f1": 0.7976224172091708, "eval_Artist_number": 1722, "eval_Artist_precision": 0.7780231916068471, "eval_Artist_recall": 0.8182346109175378, "eval_Athlete_f1": 0.7513966480446927, "eval_Athlete_number": 719, "eval_Athlete_precision": 0.7545582047685835, "eval_Athlete_recall": 0.7482614742698191, "eval_CarManufacturer_f1": 0.8109756097560975, "eval_CarManufacturer_number": 159, "eval_CarManufacturer_precision": 0.7869822485207101, "eval_CarManufacturer_recall": 0.8364779874213837, "eval_Cleric_f1": 0.6019900497512438, "eval_Cleric_number": 201, "eval_Cleric_precision": 0.6019900497512438, "eval_Cleric_recall": 0.6019900497512438, "eval_Clothing_f1": 0.6258992805755395, "eval_Clothing_number": 128, "eval_Clothing_precision": 0.58, "eval_Clothing_recall": 0.6796875, "eval_Disease_f1": 0.6816143497757847, "eval_Disease_number": 198, "eval_Disease_precision": 0.6129032258064516, "eval_Disease_recall": 0.7676767676767676, "eval_Drink_f1": 0.7840531561461794, "eval_Drink_number": 143, "eval_Drink_precision": 0.7468354430379747, "eval_Drink_recall": 0.8251748251748252, "eval_Facility_f1": 0.6948176583493282, "eval_Facility_number": 497, "eval_Facility_precision": 0.6642201834862386, "eval_Facility_recall": 0.7283702213279678, "eval_Food_f1": 0.6807511737089202, "eval_Food_number": 214, "eval_Food_precision": 0.6839622641509434, "eval_Food_recall": 0.677570093457944, "eval_HumanSettlement_f1": 0.869666861484512, "eval_HumanSettlement_number": 1689, "eval_HumanSettlement_precision": 0.8586266589728794, "eval_HumanSettlement_recall": 0.8809946714031972, "eval_MedicalProcedure_f1": 0.7608695652173914, "eval_MedicalProcedure_number": 142, "eval_MedicalProcedure_precision": 0.7835820895522388, "eval_MedicalProcedure_recall": 0.7394366197183099, "eval_Medication/Vaccine_f1": 0.7621247113163971, "eval_Medication/Vaccine_number": 200, "eval_Medication/Vaccine_precision": 0.7081545064377682, "eval_Medication/Vaccine_recall": 0.825, "eval_MusicalGRP_f1": 0.7802929427430093, "eval_MusicalGRP_number": 372, "eval_MusicalGRP_precision": 0.7730870712401056, "eval_MusicalGRP_recall": 0.7876344086021505, "eval_MusicalWork_f1": 0.7549504950495051, "eval_MusicalWork_number": 407, "eval_MusicalWork_precision": 0.7605985037406484, "eval_MusicalWork_recall": 0.7493857493857494, "eval_ORG_f1": 0.6780669144981413, "eval_ORG_number": 667, "eval_ORG_precision": 0.672566371681416, "eval_ORG_recall": 0.6836581709145427, "eval_OtherLOC_f1": 0.7425968109339407, "eval_OtherLOC_number": 224, "eval_OtherLOC_precision": 0.7581395348837209, "eval_OtherLOC_recall": 0.7276785714285714, "eval_OtherPER_f1": 0.5395763656633222, "eval_OtherPER_number": 859, "eval_OtherPER_precision": 0.5176470588235295, "eval_OtherPER_recall": 0.5634458672875436, "eval_OtherPROD_f1": 0.6287787182587666, "eval_OtherPROD_number": 433, "eval_OtherPROD_precision": 0.6598984771573604, "eval_OtherPROD_recall": 0.6004618937644342, "eval_Politician_f1": 0.5801526717557253, "eval_Politician_number": 603, "eval_Politician_precision": 0.59375, "eval_Politician_recall": 0.5671641791044776, "eval_PrivateCorp_f1": 0.7577092511013216, "eval_PrivateCorp_number": 129, "eval_PrivateCorp_precision": 0.8775510204081632, "eval_PrivateCorp_recall": 0.6666666666666666, "eval_PublicCorp_f1": 0.74, "eval_PublicCorp_number": 243, "eval_PublicCorp_precision": 0.7198443579766537, "eval_PublicCorp_recall": 0.7613168724279835, "eval_Scientist_f1": 0.5130890052356021, "eval_Scientist_number": 189, "eval_Scientist_precision": 0.5077720207253886, "eval_Scientist_recall": 0.5185185185185185, "eval_Software_f1": 0.7841845140032949, "eval_Software_number": 307, "eval_Software_precision": 0.7933333333333333, "eval_Software_recall": 0.7752442996742671, "eval_SportsGRP_f1": 0.8448275862068965, "eval_SportsGRP_number": 385, "eval_SportsGRP_precision": 0.8032786885245902, "eval_SportsGRP_recall": 0.8909090909090909, "eval_SportsManager_f1": 0.6507177033492823, "eval_SportsManager_number": 194, "eval_SportsManager_precision": 0.6071428571428571, "eval_SportsManager_recall": 0.7010309278350515, "eval_Station_f1": 0.7722772277227722, "eval_Station_number": 194, "eval_Station_precision": 0.7428571428571429, "eval_Station_recall": 0.8041237113402062, "eval_Symptom_f1": 0.6804979253112033, "eval_Symptom_number": 129, "eval_Symptom_precision": 0.7321428571428571, "eval_Symptom_recall": 0.6356589147286822, "eval_Vehicle_f1": 0.6422413793103449, "eval_Vehicle_number": 206, "eval_Vehicle_precision": 0.5775193798449613, "eval_Vehicle_recall": 0.7233009708737864, "eval_VisualWork_f1": 0.7925608011444921, "eval_VisualWork_number": 693, "eval_VisualWork_precision": 0.7858156028368795, "eval_VisualWork_recall": 0.7994227994227994, "eval_WrittenWork_f1": 0.6966864910790145, "eval_WrittenWork_number": 563, "eval_WrittenWork_precision": 0.6677524429967426, "eval_WrittenWork_recall": 0.7282415630550622, "eval_loss": 0.24561241269111633, "eval_overall_accuracy": 0.940338856983472, "eval_overall_f1": 0.7334341236771268, "eval_overall_precision": 0.7199218184450558, "eval_overall_recall": 0.7474633596392334, "eval_runtime": 43.7555, "eval_samples_per_second": 203.289, "eval_steps_per_second": 25.414, "step": 149471 }, { "epoch": 7.0, "learning_rate": 5.332427918013082e-06, "loss": 0.0977, "step": 149500 }, { "epoch": 7.02, "learning_rate": 5.316817309043226e-06, "loss": 0.0849, "step": 150000 }, { "epoch": 7.05, "learning_rate": 5.30120670007337e-06, "loss": 0.0842, "step": 150500 }, { "epoch": 7.07, "learning_rate": 5.285596091103514e-06, "loss": 0.0822, "step": 151000 }, { "epoch": 7.1, "learning_rate": 5.269985482133658e-06, "loss": 0.0775, "step": 151500 }, { "epoch": 7.12, "learning_rate": 5.2543748731638025e-06, "loss": 0.0878, "step": 152000 }, { "epoch": 7.14, "learning_rate": 5.2387642641939465e-06, "loss": 0.0835, "step": 152500 }, { "epoch": 7.17, "learning_rate": 5.2231536552240906e-06, "loss": 0.0792, "step": 153000 }, { "epoch": 7.19, "learning_rate": 5.2075430462542354e-06, "loss": 0.0908, "step": 153500 }, { "epoch": 7.21, "learning_rate": 5.1919324372843795e-06, "loss": 0.0862, "step": 154000 }, { "epoch": 7.24, "learning_rate": 5.1763218283145235e-06, "loss": 0.0823, "step": 154500 }, { "epoch": 7.26, "learning_rate": 5.160711219344668e-06, "loss": 0.0785, "step": 155000 }, { "epoch": 7.28, "learning_rate": 5.145100610374812e-06, "loss": 0.0827, "step": 155500 }, { "epoch": 7.31, "learning_rate": 5.129490001404956e-06, "loss": 0.081, "step": 156000 }, { "epoch": 7.33, "learning_rate": 5.1138793924351e-06, "loss": 0.0814, "step": 156500 }, { "epoch": 7.35, "learning_rate": 5.098268783465244e-06, "loss": 0.0799, "step": 157000 }, { "epoch": 7.38, "learning_rate": 5.082658174495387e-06, "loss": 0.0907, "step": 157500 }, { "epoch": 7.4, "learning_rate": 5.067047565525531e-06, "loss": 0.0862, "step": 158000 }, { "epoch": 7.42, "learning_rate": 5.051436956555675e-06, "loss": 0.0844, "step": 158500 }, { "epoch": 7.45, "learning_rate": 5.035826347585819e-06, "loss": 0.0795, "step": 159000 }, { "epoch": 7.47, "learning_rate": 5.020215738615963e-06, "loss": 0.0862, "step": 159500 }, { "epoch": 7.49, "learning_rate": 5.004605129646108e-06, "loss": 0.0813, "step": 160000 }, { "epoch": 7.52, "learning_rate": 4.988994520676252e-06, "loss": 0.0802, "step": 160500 }, { "epoch": 7.54, "learning_rate": 4.973383911706396e-06, "loss": 0.0871, "step": 161000 }, { "epoch": 7.56, "learning_rate": 4.95777330273654e-06, "loss": 0.0811, "step": 161500 }, { "epoch": 7.59, "learning_rate": 4.942162693766684e-06, "loss": 0.0801, "step": 162000 }, { "epoch": 7.61, "learning_rate": 4.926552084796828e-06, "loss": 0.0872, "step": 162500 }, { "epoch": 7.63, "learning_rate": 4.910941475826972e-06, "loss": 0.0825, "step": 163000 }, { "epoch": 7.66, "learning_rate": 4.895330866857116e-06, "loss": 0.0873, "step": 163500 }, { "epoch": 7.68, "learning_rate": 4.87972025788726e-06, "loss": 0.0873, "step": 164000 }, { "epoch": 7.7, "learning_rate": 4.8641096489174044e-06, "loss": 0.0938, "step": 164500 }, { "epoch": 7.73, "learning_rate": 4.848499039947549e-06, "loss": 0.088, "step": 165000 }, { "epoch": 7.75, "learning_rate": 4.832888430977693e-06, "loss": 0.089, "step": 165500 }, { "epoch": 7.77, "learning_rate": 4.817277822007837e-06, "loss": 0.0801, "step": 166000 }, { "epoch": 7.8, "learning_rate": 4.801667213037981e-06, "loss": 0.0881, "step": 166500 }, { "epoch": 7.82, "learning_rate": 4.786056604068125e-06, "loss": 0.084, "step": 167000 }, { "epoch": 7.84, "learning_rate": 4.770445995098269e-06, "loss": 0.0853, "step": 167500 }, { "epoch": 7.87, "learning_rate": 4.754835386128413e-06, "loss": 0.0826, "step": 168000 }, { "epoch": 7.89, "learning_rate": 4.739224777158558e-06, "loss": 0.0817, "step": 168500 }, { "epoch": 7.91, "learning_rate": 4.723614168188702e-06, "loss": 0.0857, "step": 169000 }, { "epoch": 7.94, "learning_rate": 4.708003559218846e-06, "loss": 0.0814, "step": 169500 }, { "epoch": 7.96, "learning_rate": 4.69239295024899e-06, "loss": 0.079, "step": 170000 }, { "epoch": 7.98, "learning_rate": 4.676782341279134e-06, "loss": 0.0838, "step": 170500 }, { "epoch": 8.0, "eval_AerospaceManufacturer_f1": 0.8243243243243245, "eval_AerospaceManufacturer_number": 138, "eval_AerospaceManufacturer_precision": 0.7721518987341772, "eval_AerospaceManufacturer_recall": 0.8840579710144928, "eval_AnatomicalStructure_f1": 0.731808731808732, "eval_AnatomicalStructure_number": 227, "eval_AnatomicalStructure_precision": 0.6929133858267716, "eval_AnatomicalStructure_recall": 0.775330396475771, "eval_ArtWork_f1": 0.681159420289855, "eval_ArtWork_number": 131, "eval_ArtWork_precision": 0.6482758620689655, "eval_ArtWork_recall": 0.7175572519083969, "eval_Artist_f1": 0.7978267086073777, "eval_Artist_number": 1722, "eval_Artist_precision": 0.7859154929577464, "eval_Artist_recall": 0.8101045296167247, "eval_Athlete_f1": 0.7366946778711484, "eval_Athlete_number": 719, "eval_Athlete_precision": 0.7418899858956276, "eval_Athlete_recall": 0.7315716272600834, "eval_CarManufacturer_f1": 0.7846607669616519, "eval_CarManufacturer_number": 159, "eval_CarManufacturer_precision": 0.7388888888888889, "eval_CarManufacturer_recall": 0.8364779874213837, "eval_Cleric_f1": 0.5882352941176471, "eval_Cleric_number": 201, "eval_Cleric_precision": 0.5797101449275363, "eval_Cleric_recall": 0.5970149253731343, "eval_Clothing_f1": 0.6304347826086957, "eval_Clothing_number": 128, "eval_Clothing_precision": 0.5878378378378378, "eval_Clothing_recall": 0.6796875, "eval_Disease_f1": 0.6859903381642511, "eval_Disease_number": 198, "eval_Disease_precision": 0.6574074074074074, "eval_Disease_recall": 0.7171717171717171, "eval_Drink_f1": 0.787878787878788, "eval_Drink_number": 143, "eval_Drink_precision": 0.7597402597402597, "eval_Drink_recall": 0.8181818181818182, "eval_Facility_f1": 0.7115577889447237, "eval_Facility_number": 497, "eval_Facility_precision": 0.7108433734939759, "eval_Facility_recall": 0.7122736418511066, "eval_Food_f1": 0.6815144766146994, "eval_Food_number": 214, "eval_Food_precision": 0.6510638297872341, "eval_Food_recall": 0.7149532710280374, "eval_HumanSettlement_f1": 0.8806146572104018, "eval_HumanSettlement_number": 1689, "eval_HumanSettlement_precision": 0.8790560471976401, "eval_HumanSettlement_recall": 0.8821788040260509, "eval_MedicalProcedure_f1": 0.7552447552447553, "eval_MedicalProcedure_number": 142, "eval_MedicalProcedure_precision": 0.75, "eval_MedicalProcedure_recall": 0.7605633802816901, "eval_Medication/Vaccine_f1": 0.7815533980582525, "eval_Medication/Vaccine_number": 200, "eval_Medication/Vaccine_precision": 0.7594339622641509, "eval_Medication/Vaccine_recall": 0.805, "eval_MusicalGRP_f1": 0.7925531914893617, "eval_MusicalGRP_number": 372, "eval_MusicalGRP_precision": 0.7842105263157895, "eval_MusicalGRP_recall": 0.8010752688172043, "eval_MusicalWork_f1": 0.7598566308243727, "eval_MusicalWork_number": 407, "eval_MusicalWork_precision": 0.7395348837209302, "eval_MusicalWork_recall": 0.7813267813267813, "eval_ORG_f1": 0.6869300911854103, "eval_ORG_number": 667, "eval_ORG_precision": 0.6964560862865947, "eval_ORG_recall": 0.6776611694152923, "eval_OtherLOC_f1": 0.7336244541484715, "eval_OtherLOC_number": 224, "eval_OtherLOC_precision": 0.717948717948718, "eval_OtherLOC_recall": 0.75, "eval_OtherPER_f1": 0.5420966865833786, "eval_OtherPER_number": 859, "eval_OtherPER_precision": 0.5081466395112016, "eval_OtherPER_recall": 0.580908032596042, "eval_OtherPROD_f1": 0.624561403508772, "eval_OtherPROD_number": 433, "eval_OtherPROD_precision": 0.6327014218009479, "eval_OtherPROD_recall": 0.6166281755196305, "eval_Politician_f1": 0.5954198473282443, "eval_Politician_number": 603, "eval_Politician_precision": 0.609375, "eval_Politician_recall": 0.582089552238806, "eval_PrivateCorp_f1": 0.7577092511013216, "eval_PrivateCorp_number": 129, "eval_PrivateCorp_precision": 0.8775510204081632, "eval_PrivateCorp_recall": 0.6666666666666666, "eval_PublicCorp_f1": 0.7228915662650603, "eval_PublicCorp_number": 243, "eval_PublicCorp_precision": 0.7058823529411765, "eval_PublicCorp_recall": 0.7407407407407407, "eval_Scientist_f1": 0.5311653116531165, "eval_Scientist_number": 189, "eval_Scientist_precision": 0.5444444444444444, "eval_Scientist_recall": 0.5185185185185185, "eval_Software_f1": 0.7833065810593901, "eval_Software_number": 307, "eval_Software_precision": 0.7721518987341772, "eval_Software_recall": 0.7947882736156352, "eval_SportsGRP_f1": 0.8407960199004975, "eval_SportsGRP_number": 385, "eval_SportsGRP_precision": 0.8066825775656324, "eval_SportsGRP_recall": 0.8779220779220779, "eval_SportsManager_f1": 0.6600000000000001, "eval_SportsManager_number": 194, "eval_SportsManager_precision": 0.6407766990291263, "eval_SportsManager_recall": 0.6804123711340206, "eval_Station_f1": 0.7951219512195122, "eval_Station_number": 194, "eval_Station_precision": 0.7546296296296297, "eval_Station_recall": 0.8402061855670103, "eval_Symptom_f1": 0.7158671586715867, "eval_Symptom_number": 129, "eval_Symptom_precision": 0.6830985915492958, "eval_Symptom_recall": 0.751937984496124, "eval_Vehicle_f1": 0.6666666666666667, "eval_Vehicle_number": 206, "eval_Vehicle_precision": 0.625531914893617, "eval_Vehicle_recall": 0.7135922330097088, "eval_VisualWork_f1": 0.7875927174645989, "eval_VisualWork_number": 693, "eval_VisualWork_precision": 0.739240506329114, "eval_VisualWork_recall": 0.8427128427128427, "eval_WrittenWork_f1": 0.7177637511271415, "eval_WrittenWork_number": 563, "eval_WrittenWork_precision": 0.7289377289377289, "eval_WrittenWork_recall": 0.7069271758436945, "eval_loss": 0.2562252879142761, "eval_overall_accuracy": 0.9414116418614963, "eval_overall_f1": 0.7375603998377042, "eval_overall_precision": 0.7241778936694191, "eval_overall_recall": 0.7514468245020669, "eval_runtime": 44.7176, "eval_samples_per_second": 198.915, "eval_steps_per_second": 24.867, "step": 170824 }, { "epoch": 8.01, "learning_rate": 4.661171732309278e-06, "loss": 0.0827, "step": 171000 }, { "epoch": 8.03, "learning_rate": 4.645561123339422e-06, "loss": 0.0683, "step": 171500 }, { "epoch": 8.06, "learning_rate": 4.629950514369566e-06, "loss": 0.0683, "step": 172000 }, { "epoch": 8.08, "learning_rate": 4.61433990539971e-06, "loss": 0.0721, "step": 172500 }, { "epoch": 8.1, "learning_rate": 4.598729296429854e-06, "loss": 0.0719, "step": 173000 }, { "epoch": 8.13, "learning_rate": 4.583118687459998e-06, "loss": 0.0744, "step": 173500 }, { "epoch": 8.15, "learning_rate": 4.567508078490142e-06, "loss": 0.0653, "step": 174000 }, { "epoch": 8.17, "learning_rate": 4.551897469520286e-06, "loss": 0.0694, "step": 174500 }, { "epoch": 8.2, "learning_rate": 4.53628686055043e-06, "loss": 0.0717, "step": 175000 }, { "epoch": 8.22, "learning_rate": 4.520676251580574e-06, "loss": 0.071, "step": 175500 }, { "epoch": 8.24, "learning_rate": 4.505065642610718e-06, "loss": 0.0697, "step": 176000 }, { "epoch": 8.27, "learning_rate": 4.489455033640862e-06, "loss": 0.0748, "step": 176500 }, { "epoch": 8.29, "learning_rate": 4.473844424671006e-06, "loss": 0.0656, "step": 177000 }, { "epoch": 8.31, "learning_rate": 4.4582338157011505e-06, "loss": 0.0711, "step": 177500 }, { "epoch": 8.34, "learning_rate": 4.442623206731295e-06, "loss": 0.0753, "step": 178000 }, { "epoch": 8.36, "learning_rate": 4.427012597761439e-06, "loss": 0.0697, "step": 178500 }, { "epoch": 8.38, "learning_rate": 4.4114019887915835e-06, "loss": 0.0732, "step": 179000 }, { "epoch": 8.41, "learning_rate": 4.3957913798217275e-06, "loss": 0.0742, "step": 179500 }, { "epoch": 8.43, "learning_rate": 4.3801807708518715e-06, "loss": 0.0733, "step": 180000 }, { "epoch": 8.45, "learning_rate": 4.364570161882016e-06, "loss": 0.0655, "step": 180500 }, { "epoch": 8.48, "learning_rate": 4.34895955291216e-06, "loss": 0.0701, "step": 181000 }, { "epoch": 8.5, "learning_rate": 4.333348943942304e-06, "loss": 0.0717, "step": 181500 }, { "epoch": 8.52, "learning_rate": 4.317738334972448e-06, "loss": 0.0702, "step": 182000 }, { "epoch": 8.55, "learning_rate": 4.302127726002592e-06, "loss": 0.0744, "step": 182500 }, { "epoch": 8.57, "learning_rate": 4.286517117032736e-06, "loss": 0.0759, "step": 183000 }, { "epoch": 8.59, "learning_rate": 4.27090650806288e-06, "loss": 0.078, "step": 183500 }, { "epoch": 8.62, "learning_rate": 4.255295899093024e-06, "loss": 0.0724, "step": 184000 }, { "epoch": 8.64, "learning_rate": 4.239685290123168e-06, "loss": 0.0694, "step": 184500 }, { "epoch": 8.66, "learning_rate": 4.224074681153312e-06, "loss": 0.0797, "step": 185000 }, { "epoch": 8.69, "learning_rate": 4.208464072183456e-06, "loss": 0.0726, "step": 185500 }, { "epoch": 8.71, "learning_rate": 4.1928534632136e-06, "loss": 0.0773, "step": 186000 }, { "epoch": 8.73, "learning_rate": 4.177242854243744e-06, "loss": 0.0695, "step": 186500 }, { "epoch": 8.76, "learning_rate": 4.161632245273888e-06, "loss": 0.0723, "step": 187000 }, { "epoch": 8.78, "learning_rate": 4.146021636304032e-06, "loss": 0.0719, "step": 187500 }, { "epoch": 8.8, "learning_rate": 4.130411027334177e-06, "loss": 0.0721, "step": 188000 }, { "epoch": 8.83, "learning_rate": 4.114800418364321e-06, "loss": 0.073, "step": 188500 }, { "epoch": 8.85, "learning_rate": 4.099189809394465e-06, "loss": 0.0741, "step": 189000 }, { "epoch": 8.87, "learning_rate": 4.083579200424609e-06, "loss": 0.0685, "step": 189500 }, { "epoch": 8.9, "learning_rate": 4.0679685914547524e-06, "loss": 0.0832, "step": 190000 }, { "epoch": 8.92, "learning_rate": 4.0523579824848965e-06, "loss": 0.0816, "step": 190500 }, { "epoch": 8.94, "learning_rate": 4.036747373515041e-06, "loss": 0.0679, "step": 191000 }, { "epoch": 8.97, "learning_rate": 4.0211367645451854e-06, "loss": 0.0729, "step": 191500 }, { "epoch": 8.99, "learning_rate": 4.0055261555753295e-06, "loss": 0.0753, "step": 192000 }, { "epoch": 9.0, "eval_AerospaceManufacturer_f1": 0.8413793103448277, "eval_AerospaceManufacturer_number": 138, "eval_AerospaceManufacturer_precision": 0.8026315789473685, "eval_AerospaceManufacturer_recall": 0.8840579710144928, "eval_AnatomicalStructure_f1": 0.7505154639175258, "eval_AnatomicalStructure_number": 227, "eval_AnatomicalStructure_precision": 0.7054263565891473, "eval_AnatomicalStructure_recall": 0.801762114537445, "eval_ArtWork_f1": 0.6417910447761195, "eval_ArtWork_number": 131, "eval_ArtWork_precision": 0.6277372262773723, "eval_ArtWork_recall": 0.6564885496183206, "eval_Artist_f1": 0.8059201340407707, "eval_Artist_number": 1722, "eval_Artist_precision": 0.7762237762237763, "eval_Artist_recall": 0.837979094076655, "eval_Athlete_f1": 0.7552155771905424, "eval_Athlete_number": 719, "eval_Athlete_precision": 0.7552155771905424, "eval_Athlete_recall": 0.7552155771905424, "eval_CarManufacturer_f1": 0.8048048048048047, "eval_CarManufacturer_number": 159, "eval_CarManufacturer_precision": 0.7701149425287356, "eval_CarManufacturer_recall": 0.8427672955974843, "eval_Cleric_f1": 0.619047619047619, "eval_Cleric_number": 201, "eval_Cleric_precision": 0.6610169491525424, "eval_Cleric_recall": 0.582089552238806, "eval_Clothing_f1": 0.6222222222222222, "eval_Clothing_number": 128, "eval_Clothing_precision": 0.5915492957746479, "eval_Clothing_recall": 0.65625, "eval_Disease_f1": 0.6906474820143884, "eval_Disease_number": 198, "eval_Disease_precision": 0.6575342465753424, "eval_Disease_recall": 0.7272727272727273, "eval_Drink_f1": 0.7859649122807018, "eval_Drink_number": 143, "eval_Drink_precision": 0.7887323943661971, "eval_Drink_recall": 0.7832167832167832, "eval_Facility_f1": 0.7105788423153692, "eval_Facility_number": 497, "eval_Facility_precision": 0.7049504950495049, "eval_Facility_recall": 0.716297786720322, "eval_Food_f1": 0.6781115879828327, "eval_Food_number": 214, "eval_Food_precision": 0.626984126984127, "eval_Food_recall": 0.7383177570093458, "eval_HumanSettlement_f1": 0.8655510675129833, "eval_HumanSettlement_number": 1689, "eval_HumanSettlement_precision": 0.8441193021947102, "eval_HumanSettlement_recall": 0.8880994671403197, "eval_MedicalProcedure_f1": 0.7561837455830389, "eval_MedicalProcedure_number": 142, "eval_MedicalProcedure_precision": 0.7588652482269503, "eval_MedicalProcedure_recall": 0.7535211267605634, "eval_Medication/Vaccine_f1": 0.7772727272727273, "eval_Medication/Vaccine_number": 200, "eval_Medication/Vaccine_precision": 0.7125, "eval_Medication/Vaccine_recall": 0.855, "eval_MusicalGRP_f1": 0.7823834196891192, "eval_MusicalGRP_number": 372, "eval_MusicalGRP_precision": 0.755, "eval_MusicalGRP_recall": 0.8118279569892473, "eval_MusicalWork_f1": 0.775267538644471, "eval_MusicalWork_number": 407, "eval_MusicalWork_precision": 0.7511520737327189, "eval_MusicalWork_recall": 0.800982800982801, "eval_ORG_f1": 0.687869822485207, "eval_ORG_number": 667, "eval_ORG_precision": 0.6788321167883211, "eval_ORG_recall": 0.697151424287856, "eval_OtherLOC_f1": 0.761467889908257, "eval_OtherLOC_number": 224, "eval_OtherLOC_precision": 0.7830188679245284, "eval_OtherLOC_recall": 0.7410714285714286, "eval_OtherPER_f1": 0.5467468562055768, "eval_OtherPER_number": 859, "eval_OtherPER_precision": 0.5154639175257731, "eval_OtherPER_recall": 0.5820721769499418, "eval_OtherPROD_f1": 0.6437571592210767, "eval_OtherPROD_number": 433, "eval_OtherPROD_precision": 0.6386363636363637, "eval_OtherPROD_recall": 0.648960739030023, "eval_Politician_f1": 0.618921308576481, "eval_Politician_number": 603, "eval_Politician_precision": 0.6628787878787878, "eval_Politician_recall": 0.5804311774461028, "eval_PrivateCorp_f1": 0.7796610169491526, "eval_PrivateCorp_number": 129, "eval_PrivateCorp_precision": 0.8598130841121495, "eval_PrivateCorp_recall": 0.7131782945736435, "eval_PublicCorp_f1": 0.7054263565891473, "eval_PublicCorp_number": 243, "eval_PublicCorp_precision": 0.6666666666666666, "eval_PublicCorp_recall": 0.7489711934156379, "eval_Scientist_f1": 0.505, "eval_Scientist_number": 189, "eval_Scientist_precision": 0.4786729857819905, "eval_Scientist_recall": 0.5343915343915344, "eval_Software_f1": 0.7744000000000001, "eval_Software_number": 307, "eval_Software_precision": 0.7610062893081762, "eval_Software_recall": 0.7882736156351792, "eval_SportsGRP_f1": 0.8585732165206508, "eval_SportsGRP_number": 385, "eval_SportsGRP_precision": 0.8285024154589372, "eval_SportsGRP_recall": 0.8909090909090909, "eval_SportsManager_f1": 0.6860158311345647, "eval_SportsManager_number": 194, "eval_SportsManager_precision": 0.7027027027027027, "eval_SportsManager_recall": 0.6701030927835051, "eval_Station_f1": 0.802992518703242, "eval_Station_number": 194, "eval_Station_precision": 0.7777777777777778, "eval_Station_recall": 0.8298969072164949, "eval_Symptom_f1": 0.7279411764705883, "eval_Symptom_number": 129, "eval_Symptom_precision": 0.6923076923076923, "eval_Symptom_recall": 0.7674418604651163, "eval_Vehicle_f1": 0.663551401869159, "eval_Vehicle_number": 206, "eval_Vehicle_precision": 0.6396396396396397, "eval_Vehicle_recall": 0.6893203883495146, "eval_VisualWork_f1": 0.7985765124555161, "eval_VisualWork_number": 693, "eval_VisualWork_precision": 0.7879213483146067, "eval_VisualWork_recall": 0.8095238095238095, "eval_WrittenWork_f1": 0.7116237799467613, "eval_WrittenWork_number": 563, "eval_WrittenWork_precision": 0.7109929078014184, "eval_WrittenWork_recall": 0.7122557726465364, "eval_loss": 0.270776629447937, "eval_overall_accuracy": 0.9424343634452129, "eval_overall_f1": 0.7422127534528357, "eval_overall_precision": 0.7258423737337453, "eval_overall_recall": 0.7593385945133408, "eval_runtime": 44.4548, "eval_samples_per_second": 200.091, "eval_steps_per_second": 25.014, "step": 192177 }, { "epoch": 9.02, "learning_rate": 3.9899155466054735e-06, "loss": 0.0658, "step": 192500 }, { "epoch": 9.04, "learning_rate": 3.9743049376356176e-06, "loss": 0.0611, "step": 193000 }, { "epoch": 9.06, "learning_rate": 3.958694328665762e-06, "loss": 0.0613, "step": 193500 }, { "epoch": 9.09, "learning_rate": 3.943083719695906e-06, "loss": 0.0636, "step": 194000 }, { "epoch": 9.11, "learning_rate": 3.92747311072605e-06, "loss": 0.0645, "step": 194500 }, { "epoch": 9.13, "learning_rate": 3.911862501756194e-06, "loss": 0.0597, "step": 195000 }, { "epoch": 9.16, "learning_rate": 3.896251892786338e-06, "loss": 0.0638, "step": 195500 }, { "epoch": 9.18, "learning_rate": 3.880641283816482e-06, "loss": 0.0606, "step": 196000 }, { "epoch": 9.2, "learning_rate": 3.865030674846626e-06, "loss": 0.0622, "step": 196500 }, { "epoch": 9.23, "learning_rate": 3.84942006587677e-06, "loss": 0.0569, "step": 197000 }, { "epoch": 9.25, "learning_rate": 3.833809456906915e-06, "loss": 0.0606, "step": 197500 }, { "epoch": 9.27, "learning_rate": 3.818198847937059e-06, "loss": 0.0626, "step": 198000 }, { "epoch": 9.3, "learning_rate": 3.8025882389672025e-06, "loss": 0.0624, "step": 198500 }, { "epoch": 9.32, "learning_rate": 3.7869776299973465e-06, "loss": 0.0696, "step": 199000 }, { "epoch": 9.34, "learning_rate": 3.7713670210274906e-06, "loss": 0.0662, "step": 199500 }, { "epoch": 9.37, "learning_rate": 3.7557564120576346e-06, "loss": 0.0613, "step": 200000 }, { "epoch": 9.39, "learning_rate": 3.7401458030877787e-06, "loss": 0.0598, "step": 200500 }, { "epoch": 9.41, "learning_rate": 3.724535194117923e-06, "loss": 0.0643, "step": 201000 }, { "epoch": 9.44, "learning_rate": 3.708924585148067e-06, "loss": 0.0624, "step": 201500 }, { "epoch": 9.46, "learning_rate": 3.6933139761782112e-06, "loss": 0.0645, "step": 202000 }, { "epoch": 9.48, "learning_rate": 3.6777033672083553e-06, "loss": 0.0681, "step": 202500 }, { "epoch": 9.51, "learning_rate": 3.662092758238499e-06, "loss": 0.0583, "step": 203000 }, { "epoch": 9.53, "learning_rate": 3.646482149268643e-06, "loss": 0.0624, "step": 203500 }, { "epoch": 9.55, "learning_rate": 3.630871540298787e-06, "loss": 0.0608, "step": 204000 }, { "epoch": 9.58, "learning_rate": 3.6152609313289315e-06, "loss": 0.0609, "step": 204500 }, { "epoch": 9.6, "learning_rate": 3.5996503223590755e-06, "loss": 0.06, "step": 205000 }, { "epoch": 9.62, "learning_rate": 3.5840397133892195e-06, "loss": 0.0625, "step": 205500 }, { "epoch": 9.65, "learning_rate": 3.5684291044193636e-06, "loss": 0.0677, "step": 206000 }, { "epoch": 9.67, "learning_rate": 3.5528184954495076e-06, "loss": 0.0656, "step": 206500 }, { "epoch": 9.69, "learning_rate": 3.5372078864796517e-06, "loss": 0.0647, "step": 207000 }, { "epoch": 9.72, "learning_rate": 3.521597277509796e-06, "loss": 0.0602, "step": 207500 }, { "epoch": 9.74, "learning_rate": 3.50598666853994e-06, "loss": 0.0639, "step": 208000 }, { "epoch": 9.76, "learning_rate": 3.4903760595700842e-06, "loss": 0.0642, "step": 208500 }, { "epoch": 9.79, "learning_rate": 3.4747654506002283e-06, "loss": 0.0656, "step": 209000 }, { "epoch": 9.81, "learning_rate": 3.4591548416303723e-06, "loss": 0.0631, "step": 209500 }, { "epoch": 9.83, "learning_rate": 3.4435442326605164e-06, "loss": 0.0605, "step": 210000 }, { "epoch": 9.86, "learning_rate": 3.42793362369066e-06, "loss": 0.065, "step": 210500 }, { "epoch": 9.88, "learning_rate": 3.412323014720805e-06, "loss": 0.0617, "step": 211000 }, { "epoch": 9.9, "learning_rate": 3.396712405750949e-06, "loss": 0.0619, "step": 211500 }, { "epoch": 9.93, "learning_rate": 3.3811017967810926e-06, "loss": 0.064, "step": 212000 }, { "epoch": 9.95, "learning_rate": 3.3654911878112366e-06, "loss": 0.0647, "step": 212500 }, { "epoch": 9.98, "learning_rate": 3.3498805788413807e-06, "loss": 0.0637, "step": 213000 }, { "epoch": 10.0, "learning_rate": 3.3342699698715247e-06, "loss": 0.0574, "step": 213500 }, { "epoch": 10.0, "eval_AerospaceManufacturer_f1": 0.8464163822525597, "eval_AerospaceManufacturer_number": 138, "eval_AerospaceManufacturer_precision": 0.8, "eval_AerospaceManufacturer_recall": 0.8985507246376812, "eval_AnatomicalStructure_f1": 0.7580299785867238, "eval_AnatomicalStructure_number": 227, "eval_AnatomicalStructure_precision": 0.7375, "eval_AnatomicalStructure_recall": 0.7797356828193832, "eval_ArtWork_f1": 0.6591760299625468, "eval_ArtWork_number": 131, "eval_ArtWork_precision": 0.6470588235294118, "eval_ArtWork_recall": 0.6717557251908397, "eval_Artist_f1": 0.791846109675567, "eval_Artist_number": 1722, "eval_Artist_precision": 0.7830777967064169, "eval_Artist_recall": 0.8008130081300813, "eval_Athlete_f1": 0.7353135313531353, "eval_Athlete_number": 719, "eval_Athlete_precision": 0.699748743718593, "eval_Athlete_recall": 0.7746870653685675, "eval_CarManufacturer_f1": 0.8083832335329343, "eval_CarManufacturer_number": 159, "eval_CarManufacturer_precision": 0.7714285714285715, "eval_CarManufacturer_recall": 0.8490566037735849, "eval_Cleric_f1": 0.6030150753768844, "eval_Cleric_number": 201, "eval_Cleric_precision": 0.6091370558375635, "eval_Cleric_recall": 0.5970149253731343, "eval_Clothing_f1": 0.6381322957198443, "eval_Clothing_number": 128, "eval_Clothing_precision": 0.6356589147286822, "eval_Clothing_recall": 0.640625, "eval_Disease_f1": 0.7035175879396985, "eval_Disease_number": 198, "eval_Disease_precision": 0.7, "eval_Disease_recall": 0.7070707070707071, "eval_Drink_f1": 0.7759197324414715, "eval_Drink_number": 143, "eval_Drink_precision": 0.7435897435897436, "eval_Drink_recall": 0.8111888111888111, "eval_Facility_f1": 0.6976744186046512, "eval_Facility_number": 497, "eval_Facility_precision": 0.6728971962616822, "eval_Facility_recall": 0.7243460764587525, "eval_Food_f1": 0.6986301369863014, "eval_Food_number": 214, "eval_Food_precision": 0.6830357142857143, "eval_Food_recall": 0.7149532710280374, "eval_HumanSettlement_f1": 0.8740870581361379, "eval_HumanSettlement_number": 1689, "eval_HumanSettlement_precision": 0.8627450980392157, "eval_HumanSettlement_recall": 0.8857312018946122, "eval_MedicalProcedure_f1": 0.7508771929824561, "eval_MedicalProcedure_number": 142, "eval_MedicalProcedure_precision": 0.7482517482517482, "eval_MedicalProcedure_recall": 0.7535211267605634, "eval_Medication/Vaccine_f1": 0.8075117370892019, "eval_Medication/Vaccine_number": 200, "eval_Medication/Vaccine_precision": 0.7610619469026548, "eval_Medication/Vaccine_recall": 0.86, "eval_MusicalGRP_f1": 0.8031496062992126, "eval_MusicalGRP_number": 372, "eval_MusicalGRP_precision": 0.7846153846153846, "eval_MusicalGRP_recall": 0.8225806451612904, "eval_MusicalWork_f1": 0.7677261613691931, "eval_MusicalWork_number": 407, "eval_MusicalWork_precision": 0.7639902676399026, "eval_MusicalWork_recall": 0.7714987714987716, "eval_ORG_f1": 0.6931137724550898, "eval_ORG_number": 667, "eval_ORG_precision": 0.6920777279521674, "eval_ORG_recall": 0.6941529235382309, "eval_OtherLOC_f1": 0.7511111111111112, "eval_OtherLOC_number": 224, "eval_OtherLOC_precision": 0.7477876106194691, "eval_OtherLOC_recall": 0.7544642857142857, "eval_OtherPER_f1": 0.5484734868773433, "eval_OtherPER_number": 859, "eval_OtherPER_precision": 0.5079365079365079, "eval_OtherPER_recall": 0.5960419091967404, "eval_OtherPROD_f1": 0.642691415313225, "eval_OtherPROD_number": 433, "eval_OtherPROD_precision": 0.6456876456876457, "eval_OtherPROD_recall": 0.6397228637413395, "eval_Politician_f1": 0.6015424164524421, "eval_Politician_number": 603, "eval_Politician_precision": 0.6223404255319149, "eval_Politician_recall": 0.582089552238806, "eval_PrivateCorp_f1": 0.7932489451476793, "eval_PrivateCorp_number": 129, "eval_PrivateCorp_precision": 0.8703703703703703, "eval_PrivateCorp_recall": 0.7286821705426356, "eval_PublicCorp_f1": 0.7372549019607844, "eval_PublicCorp_number": 243, "eval_PublicCorp_precision": 0.704119850187266, "eval_PublicCorp_recall": 0.7736625514403292, "eval_Scientist_f1": 0.5279187817258884, "eval_Scientist_number": 189, "eval_Scientist_precision": 0.5073170731707317, "eval_Scientist_recall": 0.5502645502645502, "eval_Software_f1": 0.7827476038338659, "eval_Software_number": 307, "eval_Software_precision": 0.768025078369906, "eval_Software_recall": 0.7980456026058632, "eval_SportsGRP_f1": 0.876923076923077, "eval_SportsGRP_number": 385, "eval_SportsGRP_precision": 0.8658227848101265, "eval_SportsGRP_recall": 0.8883116883116883, "eval_SportsManager_f1": 0.6844919786096256, "eval_SportsManager_number": 194, "eval_SportsManager_precision": 0.7111111111111111, "eval_SportsManager_recall": 0.6597938144329897, "eval_Station_f1": 0.7930174563591021, "eval_Station_number": 194, "eval_Station_precision": 0.7681159420289855, "eval_Station_recall": 0.8195876288659794, "eval_Symptom_f1": 0.7279693486590039, "eval_Symptom_number": 129, "eval_Symptom_precision": 0.7196969696969697, "eval_Symptom_recall": 0.7364341085271318, "eval_Vehicle_f1": 0.6651685393258426, "eval_Vehicle_number": 206, "eval_Vehicle_precision": 0.6192468619246861, "eval_Vehicle_recall": 0.7184466019417476, "eval_VisualWork_f1": 0.8056737588652482, "eval_VisualWork_number": 693, "eval_VisualWork_precision": 0.7921896792189679, "eval_VisualWork_recall": 0.8196248196248196, "eval_WrittenWork_f1": 0.72, "eval_WrittenWork_number": 563, "eval_WrittenWork_precision": 0.7206405693950177, "eval_WrittenWork_recall": 0.7193605683836589, "eval_loss": 0.286215603351593, "eval_overall_accuracy": 0.9423628444533446, "eval_overall_f1": 0.7423728813559323, "eval_overall_precision": 0.7281532345500542, "eval_overall_recall": 0.7571589627959414, "eval_runtime": 44.0314, "eval_samples_per_second": 202.015, "eval_steps_per_second": 25.255, "step": 213530 }, { "epoch": 10.02, "learning_rate": 3.318659360901669e-06, "loss": 0.057, "step": 214000 }, { "epoch": 10.05, "learning_rate": 3.3030487519318132e-06, "loss": 0.0545, "step": 214500 }, { "epoch": 10.07, "learning_rate": 3.2874381429619573e-06, "loss": 0.0518, "step": 215000 }, { "epoch": 10.09, "learning_rate": 3.2718275339921013e-06, "loss": 0.0559, "step": 215500 }, { "epoch": 10.12, "learning_rate": 3.2562169250222453e-06, "loss": 0.0545, "step": 216000 }, { "epoch": 10.14, "learning_rate": 3.2406063160523894e-06, "loss": 0.0555, "step": 216500 }, { "epoch": 10.16, "learning_rate": 3.2249957070825334e-06, "loss": 0.0547, "step": 217000 }, { "epoch": 10.19, "learning_rate": 3.209385098112678e-06, "loss": 0.0532, "step": 217500 }, { "epoch": 10.21, "learning_rate": 3.193774489142822e-06, "loss": 0.0498, "step": 218000 }, { "epoch": 10.23, "learning_rate": 3.178163880172966e-06, "loss": 0.0589, "step": 218500 }, { "epoch": 10.26, "learning_rate": 3.16255327120311e-06, "loss": 0.0556, "step": 219000 }, { "epoch": 10.28, "learning_rate": 3.1469426622332537e-06, "loss": 0.0523, "step": 219500 }, { "epoch": 10.3, "learning_rate": 3.1313320532633977e-06, "loss": 0.0543, "step": 220000 }, { "epoch": 10.33, "learning_rate": 3.1157214442935426e-06, "loss": 0.0508, "step": 220500 }, { "epoch": 10.35, "learning_rate": 3.1001108353236862e-06, "loss": 0.0554, "step": 221000 }, { "epoch": 10.37, "learning_rate": 3.0845002263538303e-06, "loss": 0.0552, "step": 221500 }, { "epoch": 10.4, "learning_rate": 3.0688896173839743e-06, "loss": 0.0563, "step": 222000 }, { "epoch": 10.42, "learning_rate": 3.0532790084141184e-06, "loss": 0.0545, "step": 222500 }, { "epoch": 10.44, "learning_rate": 3.0376683994442624e-06, "loss": 0.0521, "step": 223000 }, { "epoch": 10.47, "learning_rate": 3.0220577904744065e-06, "loss": 0.0528, "step": 223500 }, { "epoch": 10.49, "learning_rate": 3.006447181504551e-06, "loss": 0.0554, "step": 224000 }, { "epoch": 10.51, "learning_rate": 2.990836572534695e-06, "loss": 0.0561, "step": 224500 }, { "epoch": 10.54, "learning_rate": 2.975225963564839e-06, "loss": 0.0598, "step": 225000 }, { "epoch": 10.56, "learning_rate": 2.959615354594983e-06, "loss": 0.0532, "step": 225500 }, { "epoch": 10.58, "learning_rate": 2.944004745625127e-06, "loss": 0.0607, "step": 226000 }, { "epoch": 10.61, "learning_rate": 2.928394136655271e-06, "loss": 0.0554, "step": 226500 }, { "epoch": 10.63, "learning_rate": 2.9127835276854156e-06, "loss": 0.053, "step": 227000 }, { "epoch": 10.65, "learning_rate": 2.8971729187155597e-06, "loss": 0.0567, "step": 227500 }, { "epoch": 10.68, "learning_rate": 2.8815623097457037e-06, "loss": 0.0531, "step": 228000 }, { "epoch": 10.7, "learning_rate": 2.8659517007758473e-06, "loss": 0.0549, "step": 228500 }, { "epoch": 10.72, "learning_rate": 2.8503410918059914e-06, "loss": 0.0547, "step": 229000 }, { "epoch": 10.75, "learning_rate": 2.8347304828361354e-06, "loss": 0.0561, "step": 229500 }, { "epoch": 10.77, "learning_rate": 2.8191198738662795e-06, "loss": 0.0603, "step": 230000 }, { "epoch": 10.79, "learning_rate": 2.803509264896424e-06, "loss": 0.0557, "step": 230500 }, { "epoch": 10.82, "learning_rate": 2.787898655926568e-06, "loss": 0.0521, "step": 231000 }, { "epoch": 10.84, "learning_rate": 2.772288046956712e-06, "loss": 0.0587, "step": 231500 }, { "epoch": 10.86, "learning_rate": 2.756677437986856e-06, "loss": 0.0524, "step": 232000 }, { "epoch": 10.89, "learning_rate": 2.741066829017e-06, "loss": 0.0552, "step": 232500 }, { "epoch": 10.91, "learning_rate": 2.725456220047144e-06, "loss": 0.0577, "step": 233000 }, { "epoch": 10.94, "learning_rate": 2.7098456110772886e-06, "loss": 0.0582, "step": 233500 }, { "epoch": 10.96, "learning_rate": 2.6942350021074327e-06, "loss": 0.0557, "step": 234000 }, { "epoch": 10.98, "learning_rate": 2.6786243931375767e-06, "loss": 0.0568, "step": 234500 }, { "epoch": 11.0, "eval_AerospaceManufacturer_f1": 0.8413793103448277, "eval_AerospaceManufacturer_number": 138, "eval_AerospaceManufacturer_precision": 0.8026315789473685, "eval_AerospaceManufacturer_recall": 0.8840579710144928, "eval_AnatomicalStructure_f1": 0.7602591792656587, "eval_AnatomicalStructure_number": 227, "eval_AnatomicalStructure_precision": 0.7457627118644068, "eval_AnatomicalStructure_recall": 0.775330396475771, "eval_ArtWork_f1": 0.6470588235294118, "eval_ArtWork_number": 131, "eval_ArtWork_precision": 0.624113475177305, "eval_ArtWork_recall": 0.6717557251908397, "eval_Artist_f1": 0.7980877390326209, "eval_Artist_number": 1722, "eval_Artist_precision": 0.7737186477644493, "eval_Artist_recall": 0.8240418118466899, "eval_Athlete_f1": 0.7549295774647888, "eval_Athlete_number": 719, "eval_Athlete_precision": 0.7646219686162625, "eval_Athlete_recall": 0.7454798331015299, "eval_CarManufacturer_f1": 0.8271604938271604, "eval_CarManufacturer_number": 159, "eval_CarManufacturer_precision": 0.8121212121212121, "eval_CarManufacturer_recall": 0.8427672955974843, "eval_Cleric_f1": 0.6279683377308706, "eval_Cleric_number": 201, "eval_Cleric_precision": 0.6685393258426966, "eval_Cleric_recall": 0.5920398009950248, "eval_Clothing_f1": 0.6502057613168724, "eval_Clothing_number": 128, "eval_Clothing_precision": 0.6869565217391305, "eval_Clothing_recall": 0.6171875, "eval_Disease_f1": 0.7058823529411765, "eval_Disease_number": 198, "eval_Disease_precision": 0.7150259067357513, "eval_Disease_recall": 0.696969696969697, "eval_Drink_f1": 0.7816901408450705, "eval_Drink_number": 143, "eval_Drink_precision": 0.7872340425531915, "eval_Drink_recall": 0.7762237762237763, "eval_Facility_f1": 0.7032136105860114, "eval_Facility_number": 497, "eval_Facility_precision": 0.6631016042780749, "eval_Facility_recall": 0.7484909456740443, "eval_Food_f1": 0.6761229314420804, "eval_Food_number": 214, "eval_Food_precision": 0.6842105263157895, "eval_Food_recall": 0.6682242990654206, "eval_HumanSettlement_f1": 0.8709112149532711, "eval_HumanSettlement_number": 1689, "eval_HumanSettlement_precision": 0.8593659942363112, "eval_HumanSettlement_recall": 0.8827708703374778, "eval_MedicalProcedure_f1": 0.7545787545787546, "eval_MedicalProcedure_number": 142, "eval_MedicalProcedure_precision": 0.7862595419847328, "eval_MedicalProcedure_recall": 0.7253521126760564, "eval_Medication/Vaccine_f1": 0.8125, "eval_Medication/Vaccine_number": 200, "eval_Medication/Vaccine_precision": 0.7824074074074074, "eval_Medication/Vaccine_recall": 0.845, "eval_MusicalGRP_f1": 0.7827225130890051, "eval_MusicalGRP_number": 372, "eval_MusicalGRP_precision": 0.7627551020408163, "eval_MusicalGRP_recall": 0.803763440860215, "eval_MusicalWork_f1": 0.7701711491442543, "eval_MusicalWork_number": 407, "eval_MusicalWork_precision": 0.7664233576642335, "eval_MusicalWork_recall": 0.773955773955774, "eval_ORG_f1": 0.69969040247678, "eval_ORG_number": 667, "eval_ORG_precision": 0.7232, "eval_ORG_recall": 0.6776611694152923, "eval_OtherLOC_f1": 0.7586206896551725, "eval_OtherLOC_number": 224, "eval_OtherLOC_precision": 0.7819905213270142, "eval_OtherLOC_recall": 0.7366071428571429, "eval_OtherPER_f1": 0.5640176600441501, "eval_OtherPER_number": 859, "eval_OtherPER_precision": 0.5362014690451207, "eval_OtherPER_recall": 0.5948777648428405, "eval_OtherPROD_f1": 0.6385404789053591, "eval_OtherPROD_number": 433, "eval_OtherPROD_precision": 0.6306306306306306, "eval_OtherPROD_recall": 0.6466512702078522, "eval_Politician_f1": 0.6156521739130435, "eval_Politician_number": 603, "eval_Politician_precision": 0.6471663619744058, "eval_Politician_recall": 0.5870646766169154, "eval_PrivateCorp_f1": 0.7948717948717948, "eval_PrivateCorp_number": 129, "eval_PrivateCorp_precision": 0.8857142857142857, "eval_PrivateCorp_recall": 0.7209302325581395, "eval_PublicCorp_f1": 0.7499999999999999, "eval_PublicCorp_number": 243, "eval_PublicCorp_precision": 0.7137546468401487, "eval_PublicCorp_recall": 0.7901234567901234, "eval_Scientist_f1": 0.5230769230769231, "eval_Scientist_number": 189, "eval_Scientist_precision": 0.5074626865671642, "eval_Scientist_recall": 0.5396825396825397, "eval_Software_f1": 0.7922705314009663, "eval_Software_number": 307, "eval_Software_precision": 0.7834394904458599, "eval_Software_recall": 0.8013029315960912, "eval_SportsGRP_f1": 0.8756345177664975, "eval_SportsGRP_number": 385, "eval_SportsGRP_precision": 0.8560794044665012, "eval_SportsGRP_recall": 0.8961038961038961, "eval_SportsManager_f1": 0.6701570680628272, "eval_SportsManager_number": 194, "eval_SportsManager_precision": 0.6808510638297872, "eval_SportsManager_recall": 0.6597938144329897, "eval_Station_f1": 0.794044665012407, "eval_Station_number": 194, "eval_Station_precision": 0.7655502392344498, "eval_Station_recall": 0.8247422680412371, "eval_Symptom_f1": 0.7106227106227105, "eval_Symptom_number": 129, "eval_Symptom_precision": 0.6736111111111112, "eval_Symptom_recall": 0.751937984496124, "eval_Vehicle_f1": 0.638095238095238, "eval_Vehicle_number": 206, "eval_Vehicle_precision": 0.6261682242990654, "eval_Vehicle_recall": 0.6504854368932039, "eval_VisualWork_f1": 0.8048090523338047, "eval_VisualWork_number": 693, "eval_VisualWork_precision": 0.7891816920943134, "eval_VisualWork_recall": 0.8210678210678211, "eval_WrittenWork_f1": 0.7326007326007326, "eval_WrittenWork_number": 563, "eval_WrittenWork_precision": 0.7561436672967864, "eval_WrittenWork_recall": 0.7104795737122558, "eval_loss": 0.2950502634048462, "eval_overall_accuracy": 0.9431137938679617, "eval_overall_f1": 0.7468114379206485, "eval_overall_precision": 0.7390344421548425, "eval_overall_recall": 0.7547538519353626, "eval_runtime": 46.9377, "eval_samples_per_second": 189.507, "eval_steps_per_second": 23.691, "step": 234883 }, { "epoch": 11.01, "learning_rate": 2.6630137841677208e-06, "loss": 0.0546, "step": 235000 }, { "epoch": 11.03, "learning_rate": 2.647403175197865e-06, "loss": 0.0445, "step": 235500 }, { "epoch": 11.05, "learning_rate": 2.6317925662280084e-06, "loss": 0.0457, "step": 236000 }, { "epoch": 11.08, "learning_rate": 2.6161819572581525e-06, "loss": 0.0463, "step": 236500 }, { "epoch": 11.1, "learning_rate": 2.6005713482882974e-06, "loss": 0.0441, "step": 237000 }, { "epoch": 11.12, "learning_rate": 2.584960739318441e-06, "loss": 0.0497, "step": 237500 }, { "epoch": 11.15, "learning_rate": 2.569350130348585e-06, "loss": 0.0483, "step": 238000 }, { "epoch": 11.17, "learning_rate": 2.553739521378729e-06, "loss": 0.047, "step": 238500 }, { "epoch": 11.19, "learning_rate": 2.538128912408873e-06, "loss": 0.0447, "step": 239000 }, { "epoch": 11.22, "learning_rate": 2.522518303439017e-06, "loss": 0.0461, "step": 239500 }, { "epoch": 11.24, "learning_rate": 2.5069076944691616e-06, "loss": 0.0483, "step": 240000 }, { "epoch": 11.26, "learning_rate": 2.4912970854993053e-06, "loss": 0.0441, "step": 240500 }, { "epoch": 11.29, "learning_rate": 2.4756864765294497e-06, "loss": 0.0521, "step": 241000 }, { "epoch": 11.31, "learning_rate": 2.4600758675595938e-06, "loss": 0.0488, "step": 241500 }, { "epoch": 11.33, "learning_rate": 2.444465258589738e-06, "loss": 0.0481, "step": 242000 }, { "epoch": 11.36, "learning_rate": 2.428854649619882e-06, "loss": 0.0507, "step": 242500 }, { "epoch": 11.38, "learning_rate": 2.413244040650026e-06, "loss": 0.0519, "step": 243000 }, { "epoch": 11.4, "learning_rate": 2.39763343168017e-06, "loss": 0.0478, "step": 243500 }, { "epoch": 11.43, "learning_rate": 2.382022822710314e-06, "loss": 0.0466, "step": 244000 }, { "epoch": 11.45, "learning_rate": 2.3664122137404585e-06, "loss": 0.0447, "step": 244500 }, { "epoch": 11.47, "learning_rate": 2.350801604770602e-06, "loss": 0.0498, "step": 245000 }, { "epoch": 11.5, "learning_rate": 2.335190995800746e-06, "loss": 0.0496, "step": 245500 }, { "epoch": 11.52, "learning_rate": 2.3195803868308906e-06, "loss": 0.0477, "step": 246000 }, { "epoch": 11.54, "learning_rate": 2.3039697778610347e-06, "loss": 0.0474, "step": 246500 }, { "epoch": 11.57, "learning_rate": 2.2883591688911787e-06, "loss": 0.0477, "step": 247000 }, { "epoch": 11.59, "learning_rate": 2.2727485599213227e-06, "loss": 0.0494, "step": 247500 }, { "epoch": 11.61, "learning_rate": 2.257137950951467e-06, "loss": 0.0478, "step": 248000 }, { "epoch": 11.64, "learning_rate": 2.241527341981611e-06, "loss": 0.0505, "step": 248500 }, { "epoch": 11.66, "learning_rate": 2.225916733011755e-06, "loss": 0.0492, "step": 249000 }, { "epoch": 11.68, "learning_rate": 2.210306124041899e-06, "loss": 0.0503, "step": 249500 }, { "epoch": 11.71, "learning_rate": 2.194695515072043e-06, "loss": 0.0468, "step": 250000 }, { "epoch": 11.73, "learning_rate": 2.179084906102187e-06, "loss": 0.0527, "step": 250500 }, { "epoch": 11.75, "learning_rate": 2.1634742971323315e-06, "loss": 0.0511, "step": 251000 }, { "epoch": 11.78, "learning_rate": 2.1478636881624755e-06, "loss": 0.0499, "step": 251500 }, { "epoch": 11.8, "learning_rate": 2.1322530791926196e-06, "loss": 0.0508, "step": 252000 }, { "epoch": 11.83, "learning_rate": 2.1166424702227636e-06, "loss": 0.0463, "step": 252500 }, { "epoch": 11.85, "learning_rate": 2.1010318612529077e-06, "loss": 0.0495, "step": 253000 }, { "epoch": 11.87, "learning_rate": 2.0854212522830517e-06, "loss": 0.045, "step": 253500 }, { "epoch": 11.9, "learning_rate": 2.0698106433131958e-06, "loss": 0.0501, "step": 254000 }, { "epoch": 11.92, "learning_rate": 2.05420003434334e-06, "loss": 0.0475, "step": 254500 }, { "epoch": 11.94, "learning_rate": 2.038589425373484e-06, "loss": 0.0535, "step": 255000 }, { "epoch": 11.97, "learning_rate": 2.0229788164036283e-06, "loss": 0.0493, "step": 255500 }, { "epoch": 11.99, "learning_rate": 2.0073682074337724e-06, "loss": 0.0465, "step": 256000 }, { "epoch": 12.0, "eval_AerospaceManufacturer_f1": 0.8668941979522183, "eval_AerospaceManufacturer_number": 138, "eval_AerospaceManufacturer_precision": 0.8193548387096774, "eval_AerospaceManufacturer_recall": 0.9202898550724637, "eval_AnatomicalStructure_f1": 0.7453416149068323, "eval_AnatomicalStructure_number": 227, "eval_AnatomicalStructure_precision": 0.703125, "eval_AnatomicalStructure_recall": 0.7929515418502202, "eval_ArtWork_f1": 0.6263345195729537, "eval_ArtWork_number": 131, "eval_ArtWork_precision": 0.5866666666666667, "eval_ArtWork_recall": 0.6717557251908397, "eval_Artist_f1": 0.8015873015873015, "eval_Artist_number": 1722, "eval_Artist_precision": 0.7829457364341085, "eval_Artist_recall": 0.8211382113821138, "eval_Athlete_f1": 0.749648382559775, "eval_Athlete_number": 719, "eval_Athlete_precision": 0.7581792318634424, "eval_Athlete_recall": 0.741307371349096, "eval_CarManufacturer_f1": 0.8328267477203647, "eval_CarManufacturer_number": 159, "eval_CarManufacturer_precision": 0.8058823529411765, "eval_CarManufacturer_recall": 0.8616352201257862, "eval_Cleric_f1": 0.6263157894736842, "eval_Cleric_number": 201, "eval_Cleric_precision": 0.664804469273743, "eval_Cleric_recall": 0.5920398009950248, "eval_Clothing_f1": 0.6434108527131783, "eval_Clothing_number": 128, "eval_Clothing_precision": 0.6384615384615384, "eval_Clothing_recall": 0.6484375, "eval_Disease_f1": 0.6995073891625616, "eval_Disease_number": 198, "eval_Disease_precision": 0.6826923076923077, "eval_Disease_recall": 0.7171717171717171, "eval_Drink_f1": 0.8040540540540541, "eval_Drink_number": 143, "eval_Drink_precision": 0.7777777777777778, "eval_Drink_recall": 0.8321678321678322, "eval_Facility_f1": 0.6986564299424184, "eval_Facility_number": 497, "eval_Facility_precision": 0.6678899082568808, "eval_Facility_recall": 0.7323943661971831, "eval_Food_f1": 0.6958525345622121, "eval_Food_number": 214, "eval_Food_precision": 0.6863636363636364, "eval_Food_recall": 0.705607476635514, "eval_HumanSettlement_f1": 0.8683602771362587, "eval_HumanSettlement_number": 1689, "eval_HumanSettlement_precision": 0.8473239436619718, "eval_HumanSettlement_recall": 0.8904677323860273, "eval_MedicalProcedure_f1": 0.7578947368421053, "eval_MedicalProcedure_number": 142, "eval_MedicalProcedure_precision": 0.7552447552447552, "eval_MedicalProcedure_recall": 0.7605633802816901, "eval_Medication/Vaccine_f1": 0.7954022988505746, "eval_Medication/Vaccine_number": 200, "eval_Medication/Vaccine_precision": 0.7361702127659574, "eval_Medication/Vaccine_recall": 0.865, "eval_MusicalGRP_f1": 0.774025974025974, "eval_MusicalGRP_number": 372, "eval_MusicalGRP_precision": 0.7487437185929648, "eval_MusicalGRP_recall": 0.8010752688172043, "eval_MusicalWork_f1": 0.7614457831325302, "eval_MusicalWork_number": 407, "eval_MusicalWork_precision": 0.7470449172576832, "eval_MusicalWork_recall": 0.7764127764127764, "eval_ORG_f1": 0.7036759189797449, "eval_ORG_number": 667, "eval_ORG_precision": 0.7042042042042042, "eval_ORG_recall": 0.7031484257871065, "eval_OtherLOC_f1": 0.7533039647577092, "eval_OtherLOC_number": 224, "eval_OtherLOC_precision": 0.7434782608695653, "eval_OtherLOC_recall": 0.7633928571428571, "eval_OtherPER_f1": 0.5639013452914798, "eval_OtherPER_number": 859, "eval_OtherPER_precision": 0.5437837837837838, "eval_OtherPER_recall": 0.5855646100116414, "eval_OtherPROD_f1": 0.6395480225988701, "eval_OtherPROD_number": 433, "eval_OtherPROD_precision": 0.6261061946902655, "eval_OtherPROD_recall": 0.6535796766743649, "eval_Politician_f1": 0.6311336717428088, "eval_Politician_number": 603, "eval_Politician_precision": 0.6442141623488774, "eval_Politician_recall": 0.6185737976782753, "eval_PrivateCorp_f1": 0.7883817427385893, "eval_PrivateCorp_number": 129, "eval_PrivateCorp_precision": 0.8482142857142857, "eval_PrivateCorp_recall": 0.7364341085271318, "eval_PublicCorp_f1": 0.744466800804829, "eval_PublicCorp_number": 243, "eval_PublicCorp_precision": 0.7283464566929134, "eval_PublicCorp_recall": 0.7613168724279835, "eval_Scientist_f1": 0.5230769230769231, "eval_Scientist_number": 189, "eval_Scientist_precision": 0.5074626865671642, "eval_Scientist_recall": 0.5396825396825397, "eval_Software_f1": 0.7915309446254072, "eval_Software_number": 307, "eval_Software_precision": 0.7915309446254072, "eval_Software_recall": 0.7915309446254072, "eval_SportsGRP_f1": 0.8770595690747781, "eval_SportsGRP_number": 385, "eval_SportsGRP_precision": 0.8564356435643564, "eval_SportsGRP_recall": 0.8987012987012987, "eval_SportsManager_f1": 0.669833729216152, "eval_SportsManager_number": 194, "eval_SportsManager_precision": 0.6211453744493393, "eval_SportsManager_recall": 0.7268041237113402, "eval_Station_f1": 0.7880299251870324, "eval_Station_number": 194, "eval_Station_precision": 0.7632850241545893, "eval_Station_recall": 0.8144329896907216, "eval_Symptom_f1": 0.7452471482889734, "eval_Symptom_number": 129, "eval_Symptom_precision": 0.7313432835820896, "eval_Symptom_recall": 0.7596899224806202, "eval_Vehicle_f1": 0.6819221967963387, "eval_Vehicle_number": 206, "eval_Vehicle_precision": 0.645021645021645, "eval_Vehicle_recall": 0.7233009708737864, "eval_VisualWork_f1": 0.7943661971830986, "eval_VisualWork_number": 693, "eval_VisualWork_precision": 0.7757909215955984, "eval_VisualWork_recall": 0.8138528138528138, "eval_WrittenWork_f1": 0.7182222222222222, "eval_WrittenWork_number": 563, "eval_WrittenWork_precision": 0.7188612099644128, "eval_WrittenWork_recall": 0.7175843694493783, "eval_loss": 0.3102704882621765, "eval_overall_accuracy": 0.9427991103037412, "eval_overall_f1": 0.7463565435006624, "eval_overall_precision": 0.7312324222975409, "eval_overall_recall": 0.762119503945885, "eval_runtime": 45.9941, "eval_samples_per_second": 193.394, "eval_steps_per_second": 24.177, "step": 256236 }, { "epoch": 12.01, "learning_rate": 1.9917575984639164e-06, "loss": 0.0447, "step": 256500 }, { "epoch": 12.04, "learning_rate": 1.97614698949406e-06, "loss": 0.0446, "step": 257000 }, { "epoch": 12.06, "learning_rate": 1.9605363805242045e-06, "loss": 0.0414, "step": 257500 }, { "epoch": 12.08, "learning_rate": 1.9449257715543485e-06, "loss": 0.0422, "step": 258000 }, { "epoch": 12.11, "learning_rate": 1.9293151625844926e-06, "loss": 0.0386, "step": 258500 }, { "epoch": 12.13, "learning_rate": 1.9137045536146366e-06, "loss": 0.0446, "step": 259000 }, { "epoch": 12.15, "learning_rate": 1.8980939446447807e-06, "loss": 0.0443, "step": 259500 }, { "epoch": 12.18, "learning_rate": 1.8824833356749247e-06, "loss": 0.0426, "step": 260000 }, { "epoch": 12.2, "learning_rate": 1.866872726705069e-06, "loss": 0.0452, "step": 260500 }, { "epoch": 12.22, "learning_rate": 1.851262117735213e-06, "loss": 0.0447, "step": 261000 }, { "epoch": 12.25, "learning_rate": 1.835651508765357e-06, "loss": 0.0384, "step": 261500 }, { "epoch": 12.27, "learning_rate": 1.8200408997955013e-06, "loss": 0.0427, "step": 262000 }, { "epoch": 12.29, "learning_rate": 1.8044302908256454e-06, "loss": 0.0469, "step": 262500 }, { "epoch": 12.32, "learning_rate": 1.7888196818557892e-06, "loss": 0.0424, "step": 263000 }, { "epoch": 12.34, "learning_rate": 1.7732090728859333e-06, "loss": 0.0421, "step": 263500 }, { "epoch": 12.36, "learning_rate": 1.7575984639160775e-06, "loss": 0.0443, "step": 264000 }, { "epoch": 12.39, "learning_rate": 1.7419878549462216e-06, "loss": 0.0469, "step": 264500 }, { "epoch": 12.41, "learning_rate": 1.7263772459763656e-06, "loss": 0.0441, "step": 265000 }, { "epoch": 12.43, "learning_rate": 1.7107666370065099e-06, "loss": 0.0408, "step": 265500 }, { "epoch": 12.46, "learning_rate": 1.695156028036654e-06, "loss": 0.042, "step": 266000 }, { "epoch": 12.48, "learning_rate": 1.679545419066798e-06, "loss": 0.0425, "step": 266500 }, { "epoch": 12.5, "learning_rate": 1.6639348100969422e-06, "loss": 0.0435, "step": 267000 }, { "epoch": 12.53, "learning_rate": 1.648324201127086e-06, "loss": 0.0441, "step": 267500 }, { "epoch": 12.55, "learning_rate": 1.63271359215723e-06, "loss": 0.0461, "step": 268000 }, { "epoch": 12.57, "learning_rate": 1.6171029831873743e-06, "loss": 0.0445, "step": 268500 }, { "epoch": 12.6, "learning_rate": 1.6014923742175184e-06, "loss": 0.0475, "step": 269000 }, { "epoch": 12.62, "learning_rate": 1.5858817652476624e-06, "loss": 0.0473, "step": 269500 }, { "epoch": 12.64, "learning_rate": 1.5702711562778065e-06, "loss": 0.0404, "step": 270000 }, { "epoch": 12.67, "learning_rate": 1.5546605473079507e-06, "loss": 0.0408, "step": 270500 }, { "epoch": 12.69, "learning_rate": 1.5390499383380948e-06, "loss": 0.0449, "step": 271000 }, { "epoch": 12.71, "learning_rate": 1.5234393293682386e-06, "loss": 0.0463, "step": 271500 }, { "epoch": 12.74, "learning_rate": 1.5078287203983829e-06, "loss": 0.0413, "step": 272000 }, { "epoch": 12.76, "learning_rate": 1.492218111428527e-06, "loss": 0.0445, "step": 272500 }, { "epoch": 12.79, "learning_rate": 1.476607502458671e-06, "loss": 0.0439, "step": 273000 }, { "epoch": 12.81, "learning_rate": 1.4609968934888152e-06, "loss": 0.0426, "step": 273500 }, { "epoch": 12.83, "learning_rate": 1.4453862845189593e-06, "loss": 0.0427, "step": 274000 }, { "epoch": 12.86, "learning_rate": 1.4297756755491033e-06, "loss": 0.0421, "step": 274500 }, { "epoch": 12.88, "learning_rate": 1.4141650665792471e-06, "loss": 0.0425, "step": 275000 }, { "epoch": 12.9, "learning_rate": 1.3985544576093916e-06, "loss": 0.0442, "step": 275500 }, { "epoch": 12.93, "learning_rate": 1.3829438486395354e-06, "loss": 0.0426, "step": 276000 }, { "epoch": 12.95, "learning_rate": 1.3673332396696795e-06, "loss": 0.0445, "step": 276500 }, { "epoch": 12.97, "learning_rate": 1.3517226306998238e-06, "loss": 0.0461, "step": 277000 }, { "epoch": 13.0, "learning_rate": 1.3361120217299678e-06, "loss": 0.0459, "step": 277500 }, { "epoch": 13.0, "eval_AerospaceManufacturer_f1": 0.8611111111111112, "eval_AerospaceManufacturer_number": 138, "eval_AerospaceManufacturer_precision": 0.8266666666666667, "eval_AerospaceManufacturer_recall": 0.8985507246376812, "eval_AnatomicalStructure_f1": 0.751592356687898, "eval_AnatomicalStructure_number": 227, "eval_AnatomicalStructure_precision": 0.7254098360655737, "eval_AnatomicalStructure_recall": 0.7797356828193832, "eval_ArtWork_f1": 0.6323529411764706, "eval_ArtWork_number": 131, "eval_ArtWork_precision": 0.6099290780141844, "eval_ArtWork_recall": 0.6564885496183206, "eval_Artist_f1": 0.8053729637039154, "eval_Artist_number": 1722, "eval_Artist_precision": 0.7929093978615644, "eval_Artist_recall": 0.8182346109175378, "eval_Athlete_f1": 0.761904761904762, "eval_Athlete_number": 719, "eval_Athlete_precision": 0.7561643835616438, "eval_Athlete_recall": 0.7677329624478443, "eval_CarManufacturer_f1": 0.8282208588957056, "eval_CarManufacturer_number": 159, "eval_CarManufacturer_precision": 0.8083832335329342, "eval_CarManufacturer_recall": 0.8490566037735849, "eval_Cleric_f1": 0.6157760814249363, "eval_Cleric_number": 201, "eval_Cleric_precision": 0.6302083333333334, "eval_Cleric_recall": 0.6019900497512438, "eval_Clothing_f1": 0.6486486486486486, "eval_Clothing_number": 128, "eval_Clothing_precision": 0.6412213740458015, "eval_Clothing_recall": 0.65625, "eval_Disease_f1": 0.7000000000000001, "eval_Disease_number": 198, "eval_Disease_precision": 0.693069306930693, "eval_Disease_recall": 0.7070707070707071, "eval_Drink_f1": 0.7903780068728522, "eval_Drink_number": 143, "eval_Drink_precision": 0.777027027027027, "eval_Drink_recall": 0.8041958041958042, "eval_Facility_f1": 0.7098646034816248, "eval_Facility_number": 497, "eval_Facility_precision": 0.6834264432029795, "eval_Facility_recall": 0.738430583501006, "eval_Food_f1": 0.691764705882353, "eval_Food_number": 214, "eval_Food_precision": 0.6966824644549763, "eval_Food_recall": 0.6869158878504673, "eval_HumanSettlement_f1": 0.8736842105263158, "eval_HumanSettlement_number": 1689, "eval_HumanSettlement_precision": 0.8630849220103987, "eval_HumanSettlement_recall": 0.8845470692717584, "eval_MedicalProcedure_f1": 0.761904761904762, "eval_MedicalProcedure_number": 142, "eval_MedicalProcedure_precision": 0.7938931297709924, "eval_MedicalProcedure_recall": 0.7323943661971831, "eval_Medication/Vaccine_f1": 0.8058252427184467, "eval_Medication/Vaccine_number": 200, "eval_Medication/Vaccine_precision": 0.7830188679245284, "eval_Medication/Vaccine_recall": 0.83, "eval_MusicalGRP_f1": 0.7915006640106241, "eval_MusicalGRP_number": 372, "eval_MusicalGRP_precision": 0.7821522309711286, "eval_MusicalGRP_recall": 0.8010752688172043, "eval_MusicalWork_f1": 0.7608695652173912, "eval_MusicalWork_number": 407, "eval_MusicalWork_precision": 0.7482185273159145, "eval_MusicalWork_recall": 0.773955773955774, "eval_ORG_f1": 0.6976744186046512, "eval_ORG_number": 667, "eval_ORG_precision": 0.6981981981981982, "eval_ORG_recall": 0.697151424287856, "eval_OtherLOC_f1": 0.7632183908045976, "eval_OtherLOC_number": 224, "eval_OtherLOC_precision": 0.7867298578199052, "eval_OtherLOC_recall": 0.7410714285714286, "eval_OtherPER_f1": 0.5576496674057649, "eval_OtherPER_number": 859, "eval_OtherPER_precision": 0.5322751322751322, "eval_OtherPER_recall": 0.5855646100116414, "eval_OtherPROD_f1": 0.6513761467889909, "eval_OtherPROD_number": 433, "eval_OtherPROD_precision": 0.6469248291571754, "eval_OtherPROD_recall": 0.6558891454965358, "eval_Politician_f1": 0.6265060240963854, "eval_Politician_number": 603, "eval_Politician_precision": 0.6511627906976745, "eval_Politician_recall": 0.603648424543947, "eval_PrivateCorp_f1": 0.7848101265822784, "eval_PrivateCorp_number": 129, "eval_PrivateCorp_precision": 0.8611111111111112, "eval_PrivateCorp_recall": 0.7209302325581395, "eval_PublicCorp_f1": 0.750499001996008, "eval_PublicCorp_number": 243, "eval_PublicCorp_precision": 0.7286821705426356, "eval_PublicCorp_recall": 0.7736625514403292, "eval_Scientist_f1": 0.5185185185185185, "eval_Scientist_number": 189, "eval_Scientist_precision": 0.5185185185185185, "eval_Scientist_recall": 0.5185185185185185, "eval_Software_f1": 0.796116504854369, "eval_Software_number": 307, "eval_Software_precision": 0.7909967845659164, "eval_Software_recall": 0.8013029315960912, "eval_SportsGRP_f1": 0.8849104859335039, "eval_SportsGRP_number": 385, "eval_SportsGRP_precision": 0.871536523929471, "eval_SportsGRP_recall": 0.8987012987012987, "eval_SportsManager_f1": 0.7089947089947088, "eval_SportsManager_number": 194, "eval_SportsManager_precision": 0.7282608695652174, "eval_SportsManager_recall": 0.6907216494845361, "eval_Station_f1": 0.7719298245614034, "eval_Station_number": 194, "eval_Station_precision": 0.751219512195122, "eval_Station_recall": 0.7938144329896907, "eval_Symptom_f1": 0.7452471482889734, "eval_Symptom_number": 129, "eval_Symptom_precision": 0.7313432835820896, "eval_Symptom_recall": 0.7596899224806202, "eval_Vehicle_f1": 0.6498855835240275, "eval_Vehicle_number": 206, "eval_Vehicle_precision": 0.6147186147186147, "eval_Vehicle_recall": 0.6893203883495146, "eval_VisualWork_f1": 0.8104667609618105, "eval_VisualWork_number": 693, "eval_VisualWork_precision": 0.7947295423023578, "eval_VisualWork_recall": 0.8268398268398268, "eval_WrittenWork_f1": 0.7208480565371026, "eval_WrittenWork_number": 563, "eval_WrittenWork_precision": 0.7170474516695958, "eval_WrittenWork_recall": 0.7246891651865008, "eval_loss": 0.3141169548034668, "eval_overall_accuracy": 0.9436358825086002, "eval_overall_f1": 0.7495730937708813, "eval_overall_precision": 0.7405560038142742, "eval_overall_recall": 0.7588124765125892, "eval_runtime": 43.7803, "eval_samples_per_second": 203.173, "eval_steps_per_second": 25.4, "step": 277589 }, { "epoch": 13.02, "learning_rate": 1.3205014127601118e-06, "loss": 0.0391, "step": 278000 }, { "epoch": 13.04, "learning_rate": 1.304890803790256e-06, "loss": 0.0343, "step": 278500 }, { "epoch": 13.07, "learning_rate": 1.2892801948204001e-06, "loss": 0.0363, "step": 279000 }, { "epoch": 13.09, "learning_rate": 1.273669585850544e-06, "loss": 0.0386, "step": 279500 }, { "epoch": 13.11, "learning_rate": 1.2580589768806884e-06, "loss": 0.0364, "step": 280000 }, { "epoch": 13.14, "learning_rate": 1.2424483679108323e-06, "loss": 0.0429, "step": 280500 }, { "epoch": 13.16, "learning_rate": 1.2268377589409763e-06, "loss": 0.0393, "step": 281000 }, { "epoch": 13.18, "learning_rate": 1.2112271499711206e-06, "loss": 0.0364, "step": 281500 }, { "epoch": 13.21, "learning_rate": 1.1956165410012646e-06, "loss": 0.0402, "step": 282000 }, { "epoch": 13.23, "learning_rate": 1.1800059320314087e-06, "loss": 0.0386, "step": 282500 }, { "epoch": 13.25, "learning_rate": 1.1643953230615527e-06, "loss": 0.0412, "step": 283000 }, { "epoch": 13.28, "learning_rate": 1.1487847140916968e-06, "loss": 0.0374, "step": 283500 }, { "epoch": 13.3, "learning_rate": 1.1331741051218408e-06, "loss": 0.043, "step": 284000 }, { "epoch": 13.32, "learning_rate": 1.117563496151985e-06, "loss": 0.0411, "step": 284500 }, { "epoch": 13.35, "learning_rate": 1.1019528871821291e-06, "loss": 0.0394, "step": 285000 }, { "epoch": 13.37, "learning_rate": 1.0863422782122732e-06, "loss": 0.0393, "step": 285500 }, { "epoch": 13.39, "learning_rate": 1.0707316692424172e-06, "loss": 0.039, "step": 286000 }, { "epoch": 13.42, "learning_rate": 1.0551210602725612e-06, "loss": 0.0373, "step": 286500 }, { "epoch": 13.44, "learning_rate": 1.0395104513027055e-06, "loss": 0.0412, "step": 287000 }, { "epoch": 13.46, "learning_rate": 1.0238998423328496e-06, "loss": 0.04, "step": 287500 }, { "epoch": 13.49, "learning_rate": 1.0082892333629936e-06, "loss": 0.0402, "step": 288000 }, { "epoch": 13.51, "learning_rate": 9.926786243931376e-07, "loss": 0.0373, "step": 288500 }, { "epoch": 13.53, "learning_rate": 9.770680154232817e-07, "loss": 0.0406, "step": 289000 }, { "epoch": 13.56, "learning_rate": 9.61457406453426e-07, "loss": 0.0399, "step": 289500 }, { "epoch": 13.58, "learning_rate": 9.458467974835699e-07, "loss": 0.0421, "step": 290000 }, { "epoch": 13.6, "learning_rate": 9.30236188513714e-07, "loss": 0.0371, "step": 290500 }, { "epoch": 13.63, "learning_rate": 9.146255795438582e-07, "loss": 0.0379, "step": 291000 }, { "epoch": 13.65, "learning_rate": 8.990149705740021e-07, "loss": 0.0359, "step": 291500 }, { "epoch": 13.67, "learning_rate": 8.834043616041463e-07, "loss": 0.0429, "step": 292000 }, { "epoch": 13.7, "learning_rate": 8.677937526342903e-07, "loss": 0.039, "step": 292500 }, { "epoch": 13.72, "learning_rate": 8.521831436644344e-07, "loss": 0.0384, "step": 293000 }, { "epoch": 13.75, "learning_rate": 8.365725346945785e-07, "loss": 0.0385, "step": 293500 }, { "epoch": 13.77, "learning_rate": 8.209619257247226e-07, "loss": 0.0389, "step": 294000 }, { "epoch": 13.79, "learning_rate": 8.053513167548667e-07, "loss": 0.0383, "step": 294500 }, { "epoch": 13.82, "learning_rate": 7.897407077850107e-07, "loss": 0.0403, "step": 295000 }, { "epoch": 13.84, "learning_rate": 7.741300988151548e-07, "loss": 0.0395, "step": 295500 }, { "epoch": 13.86, "learning_rate": 7.58519489845299e-07, "loss": 0.038, "step": 296000 }, { "epoch": 13.89, "learning_rate": 7.42908880875443e-07, "loss": 0.0394, "step": 296500 }, { "epoch": 13.91, "learning_rate": 7.272982719055872e-07, "loss": 0.0386, "step": 297000 }, { "epoch": 13.93, "learning_rate": 7.116876629357312e-07, "loss": 0.0446, "step": 297500 }, { "epoch": 13.96, "learning_rate": 6.960770539658752e-07, "loss": 0.0418, "step": 298000 }, { "epoch": 13.98, "learning_rate": 6.804664449960194e-07, "loss": 0.0386, "step": 298500 }, { "epoch": 14.0, "eval_AerospaceManufacturer_f1": 0.8680555555555555, "eval_AerospaceManufacturer_number": 138, "eval_AerospaceManufacturer_precision": 0.8333333333333334, "eval_AerospaceManufacturer_recall": 0.9057971014492754, "eval_AnatomicalStructure_f1": 0.7447698744769874, "eval_AnatomicalStructure_number": 227, "eval_AnatomicalStructure_precision": 0.7091633466135459, "eval_AnatomicalStructure_recall": 0.7841409691629956, "eval_ArtWork_f1": 0.625, "eval_ArtWork_number": 131, "eval_ArtWork_precision": 0.6028368794326241, "eval_ArtWork_recall": 0.648854961832061, "eval_Artist_f1": 0.7997721446881231, "eval_Artist_number": 1722, "eval_Artist_precision": 0.7847959754052544, "eval_Artist_recall": 0.8153310104529616, "eval_Athlete_f1": 0.7647058823529412, "eval_Athlete_number": 719, "eval_Athlete_precision": 0.770098730606488, "eval_Athlete_recall": 0.7593880389429764, "eval_CarManufacturer_f1": 0.8292682926829269, "eval_CarManufacturer_number": 159, "eval_CarManufacturer_precision": 0.8047337278106509, "eval_CarManufacturer_recall": 0.8553459119496856, "eval_Cleric_f1": 0.6243654822335025, "eval_Cleric_number": 201, "eval_Cleric_precision": 0.6373056994818653, "eval_Cleric_recall": 0.6119402985074627, "eval_Clothing_f1": 0.6415094339622641, "eval_Clothing_number": 128, "eval_Clothing_precision": 0.6204379562043796, "eval_Clothing_recall": 0.6640625, "eval_Disease_f1": 0.6977886977886978, "eval_Disease_number": 198, "eval_Disease_precision": 0.6794258373205742, "eval_Disease_recall": 0.7171717171717171, "eval_Drink_f1": 0.8013937282229965, "eval_Drink_number": 143, "eval_Drink_precision": 0.7986111111111112, "eval_Drink_recall": 0.8041958041958042, "eval_Facility_f1": 0.6993275696445725, "eval_Facility_number": 497, "eval_Facility_precision": 0.6691176470588235, "eval_Facility_recall": 0.7323943661971831, "eval_Food_f1": 0.7058823529411764, "eval_Food_number": 214, "eval_Food_precision": 0.7109004739336493, "eval_Food_recall": 0.7009345794392523, "eval_HumanSettlement_f1": 0.8727698157355952, "eval_HumanSettlement_number": 1689, "eval_HumanSettlement_precision": 0.8624277456647399, "eval_HumanSettlement_recall": 0.8833629366489046, "eval_MedicalProcedure_f1": 0.7642857142857142, "eval_MedicalProcedure_number": 142, "eval_MedicalProcedure_precision": 0.7753623188405797, "eval_MedicalProcedure_recall": 0.7535211267605634, "eval_Medication/Vaccine_f1": 0.8019323671497584, "eval_Medication/Vaccine_number": 200, "eval_Medication/Vaccine_precision": 0.7757009345794392, "eval_Medication/Vaccine_recall": 0.83, "eval_MusicalGRP_f1": 0.7884362680683311, "eval_MusicalGRP_number": 372, "eval_MusicalGRP_precision": 0.7712082262210797, "eval_MusicalGRP_recall": 0.8064516129032258, "eval_MusicalWork_f1": 0.7667887667887667, "eval_MusicalWork_number": 407, "eval_MusicalWork_precision": 0.7621359223300971, "eval_MusicalWork_recall": 0.7714987714987716, "eval_ORG_f1": 0.6925898752751284, "eval_ORG_number": 667, "eval_ORG_precision": 0.6781609195402298, "eval_ORG_recall": 0.7076461769115442, "eval_OtherLOC_f1": 0.755656108597285, "eval_OtherLOC_number": 224, "eval_OtherLOC_precision": 0.7660550458715596, "eval_OtherLOC_recall": 0.7455357142857143, "eval_OtherPER_f1": 0.5540386803185438, "eval_OtherPER_number": 859, "eval_OtherPER_precision": 0.5417130144605117, "eval_OtherPER_recall": 0.5669383003492433, "eval_OtherPROD_f1": 0.6461187214611873, "eval_OtherPROD_number": 433, "eval_OtherPROD_precision": 0.6388261851015802, "eval_OtherPROD_recall": 0.6535796766743649, "eval_Politician_f1": 0.6139767054908486, "eval_Politician_number": 603, "eval_Politician_precision": 0.6160267111853088, "eval_Politician_recall": 0.6119402985074627, "eval_PrivateCorp_f1": 0.8101265822784809, "eval_PrivateCorp_number": 129, "eval_PrivateCorp_precision": 0.8888888888888888, "eval_PrivateCorp_recall": 0.7441860465116279, "eval_PublicCorp_f1": 0.7580645161290323, "eval_PublicCorp_number": 243, "eval_PublicCorp_precision": 0.7430830039525692, "eval_PublicCorp_recall": 0.7736625514403292, "eval_Scientist_f1": 0.5204081632653063, "eval_Scientist_number": 189, "eval_Scientist_precision": 0.5024630541871922, "eval_Scientist_recall": 0.5396825396825397, "eval_Software_f1": 0.7915309446254072, "eval_Software_number": 307, "eval_Software_precision": 0.7915309446254072, "eval_Software_recall": 0.7915309446254072, "eval_SportsGRP_f1": 0.8761174968071519, "eval_SportsGRP_number": 385, "eval_SportsGRP_precision": 0.8618090452261307, "eval_SportsGRP_recall": 0.8909090909090909, "eval_SportsManager_f1": 0.6900000000000001, "eval_SportsManager_number": 194, "eval_SportsManager_precision": 0.6699029126213593, "eval_SportsManager_recall": 0.711340206185567, "eval_Station_f1": 0.7849999999999999, "eval_Station_number": 194, "eval_Station_precision": 0.7621359223300971, "eval_Station_recall": 0.8092783505154639, "eval_Symptom_f1": 0.744360902255639, "eval_Symptom_number": 129, "eval_Symptom_precision": 0.7226277372262774, "eval_Symptom_recall": 0.7674418604651163, "eval_Vehicle_f1": 0.6651162790697674, "eval_Vehicle_number": 206, "eval_Vehicle_precision": 0.6383928571428571, "eval_Vehicle_recall": 0.6941747572815534, "eval_VisualWork_f1": 0.8016997167138811, "eval_VisualWork_number": 693, "eval_VisualWork_precision": 0.7872044506258693, "eval_VisualWork_recall": 0.8167388167388168, "eval_WrittenWork_f1": 0.7184466019417476, "eval_WrittenWork_number": 563, "eval_WrittenWork_precision": 0.7140350877192982, "eval_WrittenWork_recall": 0.7229129662522202, "eval_loss": 0.32683783769607544, "eval_overall_accuracy": 0.9434713888273031, "eval_overall_f1": 0.7469745753302987, "eval_overall_precision": 0.7357830271216098, "eval_overall_recall": 0.758511837655017, "eval_runtime": 43.8843, "eval_samples_per_second": 202.692, "eval_steps_per_second": 25.339, "step": 298942 }, { "epoch": 14.0, "learning_rate": 6.648558360261633e-07, "loss": 0.0375, "step": 299000 }, { "epoch": 14.03, "learning_rate": 6.492452270563075e-07, "loss": 0.0379, "step": 299500 }, { "epoch": 14.05, "learning_rate": 6.336346180864516e-07, "loss": 0.0334, "step": 300000 }, { "epoch": 14.07, "learning_rate": 6.180240091165957e-07, "loss": 0.0428, "step": 300500 }, { "epoch": 14.1, "learning_rate": 6.024134001467398e-07, "loss": 0.0341, "step": 301000 }, { "epoch": 14.12, "learning_rate": 5.868027911768839e-07, "loss": 0.0309, "step": 301500 }, { "epoch": 14.14, "learning_rate": 5.711921822070279e-07, "loss": 0.0383, "step": 302000 }, { "epoch": 14.17, "learning_rate": 5.55581573237172e-07, "loss": 0.0385, "step": 302500 }, { "epoch": 14.19, "learning_rate": 5.399709642673161e-07, "loss": 0.0375, "step": 303000 }, { "epoch": 14.21, "learning_rate": 5.243603552974602e-07, "loss": 0.0356, "step": 303500 }, { "epoch": 14.24, "learning_rate": 5.087497463276043e-07, "loss": 0.0377, "step": 304000 }, { "epoch": 14.26, "learning_rate": 4.931391373577484e-07, "loss": 0.0376, "step": 304500 }, { "epoch": 14.28, "learning_rate": 4.775285283878924e-07, "loss": 0.0356, "step": 305000 }, { "epoch": 14.31, "learning_rate": 4.6191791941803656e-07, "loss": 0.037, "step": 305500 }, { "epoch": 14.33, "learning_rate": 4.463073104481806e-07, "loss": 0.0359, "step": 306000 }, { "epoch": 14.35, "learning_rate": 4.306967014783247e-07, "loss": 0.0332, "step": 306500 }, { "epoch": 14.38, "learning_rate": 4.1508609250846875e-07, "loss": 0.0359, "step": 307000 }, { "epoch": 14.4, "learning_rate": 3.994754835386129e-07, "loss": 0.0375, "step": 307500 }, { "epoch": 14.42, "learning_rate": 3.8386487456875694e-07, "loss": 0.0377, "step": 308000 }, { "epoch": 14.45, "learning_rate": 3.6825426559890104e-07, "loss": 0.0372, "step": 308500 }, { "epoch": 14.47, "learning_rate": 3.526436566290451e-07, "loss": 0.0346, "step": 309000 }, { "epoch": 14.49, "learning_rate": 3.3703304765918924e-07, "loss": 0.0351, "step": 309500 }, { "epoch": 14.52, "learning_rate": 3.2142243868933334e-07, "loss": 0.0385, "step": 310000 }, { "epoch": 14.54, "learning_rate": 3.058118297194774e-07, "loss": 0.0389, "step": 310500 }, { "epoch": 14.56, "learning_rate": 2.9020122074962143e-07, "loss": 0.0325, "step": 311000 }, { "epoch": 14.59, "learning_rate": 2.745906117797656e-07, "loss": 0.037, "step": 311500 }, { "epoch": 14.61, "learning_rate": 2.589800028099096e-07, "loss": 0.0397, "step": 312000 }, { "epoch": 14.63, "learning_rate": 2.433693938400537e-07, "loss": 0.0382, "step": 312500 }, { "epoch": 14.66, "learning_rate": 2.277587848701978e-07, "loss": 0.0328, "step": 313000 }, { "epoch": 14.68, "learning_rate": 2.121481759003419e-07, "loss": 0.0346, "step": 313500 }, { "epoch": 14.71, "learning_rate": 1.9653756693048597e-07, "loss": 0.0375, "step": 314000 }, { "epoch": 14.73, "learning_rate": 1.8092695796063006e-07, "loss": 0.0377, "step": 314500 }, { "epoch": 14.75, "learning_rate": 1.6531634899077414e-07, "loss": 0.0338, "step": 315000 }, { "epoch": 14.78, "learning_rate": 1.4970574002091823e-07, "loss": 0.0407, "step": 315500 }, { "epoch": 14.8, "learning_rate": 1.340951310510623e-07, "loss": 0.0321, "step": 316000 }, { "epoch": 14.82, "learning_rate": 1.184845220812064e-07, "loss": 0.04, "step": 316500 }, { "epoch": 14.85, "learning_rate": 1.0287391311135049e-07, "loss": 0.0396, "step": 317000 }, { "epoch": 14.87, "learning_rate": 8.726330414149456e-08, "loss": 0.0348, "step": 317500 }, { "epoch": 14.89, "learning_rate": 7.165269517163866e-08, "loss": 0.0405, "step": 318000 }, { "epoch": 14.92, "learning_rate": 5.604208620178273e-08, "loss": 0.0362, "step": 318500 }, { "epoch": 14.94, "learning_rate": 4.0431477231926816e-08, "loss": 0.0371, "step": 319000 }, { "epoch": 14.96, "learning_rate": 2.4820868262070904e-08, "loss": 0.0337, "step": 319500 }, { "epoch": 14.99, "learning_rate": 9.21025929221499e-09, "loss": 0.037, "step": 320000 }, { "epoch": 15.0, "eval_AerospaceManufacturer_f1": 0.8561643835616438, "eval_AerospaceManufacturer_number": 138, "eval_AerospaceManufacturer_precision": 0.8116883116883117, "eval_AerospaceManufacturer_recall": 0.9057971014492754, "eval_AnatomicalStructure_f1": 0.7505241090146751, "eval_AnatomicalStructure_number": 227, "eval_AnatomicalStructure_precision": 0.716, "eval_AnatomicalStructure_recall": 0.788546255506608, "eval_ArtWork_f1": 0.625, "eval_ArtWork_number": 131, "eval_ArtWork_precision": 0.6028368794326241, "eval_ArtWork_recall": 0.648854961832061, "eval_Artist_f1": 0.803960396039604, "eval_Artist_number": 1722, "eval_Artist_precision": 0.7837837837837838, "eval_Artist_recall": 0.8252032520325203, "eval_Athlete_f1": 0.7691218130311614, "eval_Athlete_number": 719, "eval_Athlete_precision": 0.7835497835497836, "eval_Athlete_recall": 0.7552155771905424, "eval_CarManufacturer_f1": 0.8242424242424242, "eval_CarManufacturer_number": 159, "eval_CarManufacturer_precision": 0.7953216374269005, "eval_CarManufacturer_recall": 0.8553459119496856, "eval_Cleric_f1": 0.6282722513089004, "eval_Cleric_number": 201, "eval_Cleric_precision": 0.6629834254143646, "eval_Cleric_recall": 0.5970149253731343, "eval_Clothing_f1": 0.6463878326996197, "eval_Clothing_number": 128, "eval_Clothing_precision": 0.6296296296296297, "eval_Clothing_recall": 0.6640625, "eval_Disease_f1": 0.7064676616915423, "eval_Disease_number": 198, "eval_Disease_precision": 0.696078431372549, "eval_Disease_recall": 0.7171717171717171, "eval_Drink_f1": 0.8055555555555556, "eval_Drink_number": 143, "eval_Drink_precision": 0.8, "eval_Drink_recall": 0.8111888111888111, "eval_Facility_f1": 0.7069133398247323, "eval_Facility_number": 497, "eval_Facility_precision": 0.6849056603773584, "eval_Facility_recall": 0.7303822937625755, "eval_Food_f1": 0.7105882352941177, "eval_Food_number": 214, "eval_Food_precision": 0.7156398104265402, "eval_Food_recall": 0.705607476635514, "eval_HumanSettlement_f1": 0.8736842105263158, "eval_HumanSettlement_number": 1689, "eval_HumanSettlement_precision": 0.8630849220103987, "eval_HumanSettlement_recall": 0.8845470692717584, "eval_MedicalProcedure_f1": 0.7653429602888087, "eval_MedicalProcedure_number": 142, "eval_MedicalProcedure_precision": 0.7851851851851852, "eval_MedicalProcedure_recall": 0.7464788732394366, "eval_Medication/Vaccine_f1": 0.7980997624703088, "eval_Medication/Vaccine_number": 200, "eval_Medication/Vaccine_precision": 0.7601809954751131, "eval_Medication/Vaccine_recall": 0.84, "eval_MusicalGRP_f1": 0.7838541666666667, "eval_MusicalGRP_number": 372, "eval_MusicalGRP_precision": 0.76010101010101, "eval_MusicalGRP_recall": 0.8091397849462365, "eval_MusicalWork_f1": 0.7560975609756098, "eval_MusicalWork_number": 407, "eval_MusicalWork_precision": 0.7506053268765133, "eval_MusicalWork_recall": 0.7616707616707616, "eval_ORG_f1": 0.7045790251107829, "eval_ORG_number": 667, "eval_ORG_precision": 0.6943231441048034, "eval_ORG_recall": 0.7151424287856072, "eval_OtherLOC_f1": 0.7608200455580867, "eval_OtherLOC_number": 224, "eval_OtherLOC_precision": 0.7767441860465116, "eval_OtherLOC_recall": 0.7455357142857143, "eval_OtherPER_f1": 0.5466970387243736, "eval_OtherPER_number": 859, "eval_OtherPER_precision": 0.5351170568561873, "eval_OtherPER_recall": 0.5587892898719441, "eval_OtherPROD_f1": 0.6482758620689655, "eval_OtherPROD_number": 433, "eval_OtherPROD_precision": 0.6453089244851259, "eval_OtherPROD_recall": 0.651270207852194, "eval_Politician_f1": 0.6214405360134004, "eval_Politician_number": 603, "eval_Politician_precision": 0.6277495769881557, "eval_Politician_recall": 0.615257048092869, "eval_PrivateCorp_f1": 0.8185654008438819, "eval_PrivateCorp_number": 129, "eval_PrivateCorp_precision": 0.8981481481481481, "eval_PrivateCorp_recall": 0.751937984496124, "eval_PublicCorp_f1": 0.7525150905432596, "eval_PublicCorp_number": 243, "eval_PublicCorp_precision": 0.7362204724409449, "eval_PublicCorp_recall": 0.7695473251028807, "eval_Scientist_f1": 0.528497409326425, "eval_Scientist_number": 189, "eval_Scientist_precision": 0.5177664974619289, "eval_Scientist_recall": 0.5396825396825397, "eval_Software_f1": 0.7844408427876823, "eval_Software_number": 307, "eval_Software_precision": 0.7806451612903226, "eval_Software_recall": 0.7882736156351792, "eval_SportsGRP_f1": 0.8894601542416454, "eval_SportsGRP_number": 385, "eval_SportsGRP_precision": 0.8804071246819338, "eval_SportsGRP_recall": 0.8987012987012987, "eval_SportsManager_f1": 0.7035175879396985, "eval_SportsManager_number": 194, "eval_SportsManager_precision": 0.6862745098039216, "eval_SportsManager_recall": 0.7216494845360825, "eval_Station_f1": 0.7889447236180904, "eval_Station_number": 194, "eval_Station_precision": 0.7696078431372549, "eval_Station_recall": 0.8092783505154639, "eval_Symptom_f1": 0.7499999999999999, "eval_Symptom_number": 129, "eval_Symptom_precision": 0.7333333333333333, "eval_Symptom_recall": 0.7674418604651163, "eval_Vehicle_f1": 0.6697892271662763, "eval_Vehicle_number": 206, "eval_Vehicle_precision": 0.6470588235294118, "eval_Vehicle_recall": 0.6941747572815534, "eval_VisualWork_f1": 0.8067940552016986, "eval_VisualWork_number": 693, "eval_VisualWork_precision": 0.7916666666666666, "eval_VisualWork_recall": 0.8225108225108225, "eval_WrittenWork_f1": 0.7241992882562278, "eval_WrittenWork_number": 563, "eval_WrittenWork_precision": 0.7254901960784313, "eval_WrittenWork_recall": 0.7229129662522202, "eval_loss": 0.330758273601532, "eval_overall_accuracy": 0.9436644901053475, "eval_overall_f1": 0.7500649037570004, "eval_overall_precision": 0.7403719431834822, "eval_overall_recall": 0.7600150319428787, "eval_runtime": 44.2122, "eval_samples_per_second": 201.189, "eval_steps_per_second": 25.151, "step": 320295 }, { "epoch": 15.0, "step": 320295, "total_flos": 6.580397404702666e+16, "train_loss": 0.11691759577826058, "train_runtime": 70734.3148, "train_samples_per_second": 36.225, "train_steps_per_second": 4.528 } ], "max_steps": 320295, "num_train_epochs": 15, "total_flos": 6.580397404702666e+16, "trial_name": null, "trial_params": null }