{ "best_metric": 0.2527652680873871, "best_model_checkpoint": "longformer-sep_tok/checkpoint-324", "epoch": 6.0, "eval_steps": 500, "global_step": 486, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_Claim": { "f1-score": 0.580553004795429, "precision": 0.5136306192453511, "recall": 0.6675269826372595, "support": 4262.0 }, "eval_MajorClaim": { "f1-score": 0.6929252383341696, "precision": 0.7583745194947831, "recall": 0.6378752886836028, "support": 2165.0 }, "eval_O": { "f1-score": 0.9968272281511393, "precision": 0.9967861557478368, "recall": 0.996868303939344, "support": 12134.0 }, "eval_Premise": { "f1-score": 0.8769487750556793, "precision": 0.9107806691449815, "recall": 0.8455403021704119, "support": 13039.0 }, "eval_accuracy": 0.8654113924050633, "eval_loss": 0.32089120149612427, "eval_macro avg": { "f1-score": 0.7868135615841043, "precision": 0.7948929909082382, "recall": 0.7869527193576545, "support": 31600.0 }, "eval_runtime": 5.9486, "eval_samples_per_second": 13.449, "eval_steps_per_second": 1.681, "eval_weighted avg": { "f1-score": 0.8703967313850799, "precision": 0.8797989523023909, "recall": 0.8654113924050633, "support": 31600.0 }, "step": 81 }, { "epoch": 2.0, "eval_Claim": { "f1-score": 0.6029902384776968, "precision": 0.6369094231271208, "recall": 0.5725011731581418, "support": 4262.0 }, "eval_MajorClaim": { "f1-score": 0.8179940325912326, "precision": 0.8129562043795621, "recall": 0.8230946882217091, "support": 2165.0 }, "eval_O": { "f1-score": 0.9984359565360553, "precision": 0.9972866304884065, "recall": 0.9995879347288611, "support": 12134.0 }, "eval_Premise": { "f1-score": 0.9017917895214335, "precision": 0.8891539321654864, "recall": 0.9147940793005599, "support": 13039.0 }, "eval_accuracy": 0.8949050632911393, "eval_loss": 0.25671303272247314, "eval_macro avg": { "f1-score": 0.8303030042816045, "precision": 0.8340765475401439, "recall": 0.8274944688523179, "support": 31600.0 }, "eval_runtime": 5.97, "eval_samples_per_second": 13.4, "eval_steps_per_second": 1.675, "eval_weighted avg": { "f1-score": 0.8928603328205832, "precision": 0.8914339316361279, "recall": 0.8949050632911393, "support": 31600.0 }, "step": 162 }, { "epoch": 3.0, "eval_Claim": { "f1-score": 0.6010706092276319, "precision": 0.6579241071428571, "recall": 0.5532613796339747, "support": 4262.0 }, "eval_MajorClaim": { "f1-score": 0.8101840181497353, "precision": 0.8917869034406215, "recall": 0.7422632794457275, "support": 2165.0 }, "eval_O": { "f1-score": 0.997983456109305, "precision": 0.9967118783394986, "recall": 0.9992582825119499, "support": 12134.0 }, "eval_Premise": { "f1-score": 0.9085203780271707, "precision": 0.8758630507509432, "recall": 0.9437073395199018, "support": 13039.0 }, "eval_accuracy": 0.8985759493670886, "eval_loss": 0.2674676775932312, "eval_macro avg": { "f1-score": 0.8294396153784607, "precision": 0.8555714849184801, "recall": 0.8096225702778885, "support": 31600.0 }, "eval_runtime": 6.0212, "eval_samples_per_second": 13.286, "eval_steps_per_second": 1.661, "eval_weighted avg": { "f1-score": 0.894668981055346, "precision": 0.8939642861109123, "recall": 0.8985759493670886, "support": 31600.0 }, "step": 243 }, { "epoch": 4.0, "eval_Claim": { "f1-score": 0.66, "precision": 0.6399294843543412, "recall": 0.681370248709526, "support": 4262.0 }, "eval_MajorClaim": { "f1-score": 0.8682903759754079, "precision": 0.8895348837209303, "recall": 0.8480369515011548, "support": 2165.0 }, "eval_O": { "f1-score": 0.9983125488743466, "precision": 0.9971224204554797, "recall": 0.9995055216746332, "support": 12134.0 }, "eval_Premise": { "f1-score": 0.9011362757980985, "precision": 0.9082976236852357, "recall": 0.8940869698596519, "support": 13039.0 }, "eval_accuracy": 0.9027215189873418, "eval_loss": 0.2527652680873871, "eval_macro avg": { "f1-score": 0.8569348001619632, "precision": 0.8587211030539967, "recall": 0.8557499229362415, "support": 31600.0 }, "eval_runtime": 5.9641, "eval_samples_per_second": 13.414, "eval_steps_per_second": 1.677, "eval_weighted avg": { "f1-score": 0.9036775010177053, "precision": 0.9049240079307782, "recall": 0.9027215189873418, "support": 31600.0 }, "step": 324 }, { "epoch": 5.0, "eval_Claim": { "f1-score": 0.6614122219822932, "precision": 0.6126, "recall": 0.7186766776161426, "support": 4262.0 }, "eval_MajorClaim": { "f1-score": 0.805946376426865, "precision": 0.947565543071161, "recall": 0.7011547344110854, "support": 2165.0 }, "eval_O": { "f1-score": 0.998518030627367, "precision": 0.9975324888962, "recall": 0.9995055216746332, "support": 12134.0 }, "eval_Premise": { "f1-score": 0.9051354379999227, "precision": 0.9121495327102803, "recall": 0.8982283917478334, "support": 13039.0 }, "eval_accuracy": 0.8993987341772152, "eval_loss": 0.29903507232666016, "eval_macro avg": { "f1-score": 0.842753016759112, "precision": 0.8674618911694103, "recall": 0.8293913313624237, "support": 31600.0 }, "eval_runtime": 5.9489, "eval_samples_per_second": 13.448, "eval_steps_per_second": 1.681, "eval_weighted avg": { "f1-score": 0.9013256821128531, "precision": 0.9069606828488892, "recall": 0.8993987341772152, "support": 31600.0 }, "step": 405 }, { "epoch": 6.0, "eval_Claim": { "f1-score": 0.6276952563488261, "precision": 0.6412139011257953, "recall": 0.6147348662599719, "support": 4262.0 }, "eval_MajorClaim": { "f1-score": 0.8774834437086093, "precision": 0.8991759573436743, "recall": 0.8568129330254042, "support": 2165.0 }, "eval_O": { "f1-score": 0.9990939044481055, "precision": 0.99860036225918, "recall": 0.9995879347288611, "support": 12134.0 }, "eval_Premise": { "f1-score": 0.8991800789553598, "precision": 0.8901916572717024, "recall": 0.9083518674744996, "support": 13039.0 }, "eval_accuracy": 0.900253164556962, "eval_loss": 0.3113674819469452, "eval_macro avg": { "f1-score": 0.8508631708652252, "precision": 0.8572954695000881, "recall": 0.8448719003721842, "support": 31600.0 }, "eval_runtime": 5.9773, "eval_samples_per_second": 13.384, "eval_steps_per_second": 1.673, "eval_weighted avg": { "f1-score": 0.8994431431727875, "precision": 0.8988542850970194, "recall": 0.900253164556962, "support": 31600.0 }, "step": 486 } ], "logging_steps": 500, "max_steps": 1620, "num_input_tokens_seen": 0, "num_train_epochs": 20, "save_steps": 500, "total_flos": 862732396360800.0, "train_batch_size": 4, "trial_name": null, "trial_params": null }