|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 9.0, |
|
"eval_steps": 500, |
|
"global_step": 729, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_Claim": { |
|
"f1-score": 0.5254768748366867, |
|
"precision": 0.5768789443488239, |
|
"recall": 0.4824856046065259, |
|
"support": 4168.0 |
|
}, |
|
"eval_MajorClaim": { |
|
"f1-score": 0.7984361424847959, |
|
"precision": 0.7495921696574225, |
|
"recall": 0.854089219330855, |
|
"support": 2152.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9990277532260916, |
|
"precision": 0.9988511841640155, |
|
"recall": 0.9992043847241867, |
|
"support": 11312.0 |
|
}, |
|
"eval_Premise": { |
|
"f1-score": 0.8854183656825966, |
|
"precision": 0.8719781543651113, |
|
"recall": 0.8992793837488611, |
|
"support": 12073.0 |
|
}, |
|
"eval_accuracy": 0.8755765022723447, |
|
"eval_loss": 0.28303390741348267, |
|
"eval_macro avg": { |
|
"f1-score": 0.8020897840575427, |
|
"precision": 0.7993251131338432, |
|
"recall": 0.8087646481026072, |
|
"support": 29705.0 |
|
}, |
|
"eval_runtime": 4.8106, |
|
"eval_samples_per_second": 16.63, |
|
"eval_steps_per_second": 2.079, |
|
"eval_weighted avg": { |
|
"f1-score": 0.8718761173649596, |
|
"precision": 0.8700202202343714, |
|
"recall": 0.8755765022723447, |
|
"support": 29705.0 |
|
}, |
|
"step": 81 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_Claim": { |
|
"f1-score": 0.5578782336033447, |
|
"precision": 0.6124497991967871, |
|
"recall": 0.5122360844529751, |
|
"support": 4168.0 |
|
}, |
|
"eval_MajorClaim": { |
|
"f1-score": 0.784421283598464, |
|
"precision": 0.9571619812583668, |
|
"recall": 0.6644981412639405, |
|
"support": 2152.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9998674150351351, |
|
"precision": 0.9997348652231551, |
|
"recall": 1.0, |
|
"support": 11312.0 |
|
}, |
|
"eval_Premise": { |
|
"f1-score": 0.8977749872463995, |
|
"precision": 0.8530201342281879, |
|
"recall": 0.9474861260664292, |
|
"support": 12073.0 |
|
}, |
|
"eval_accuracy": 0.8859114627167144, |
|
"eval_loss": 0.27363118529319763, |
|
"eval_macro avg": { |
|
"f1-score": 0.8099854798708358, |
|
"precision": 0.8555916949766242, |
|
"recall": 0.7810550879458362, |
|
"support": 29705.0 |
|
}, |
|
"eval_runtime": 4.7727, |
|
"eval_samples_per_second": 16.762, |
|
"eval_steps_per_second": 2.095, |
|
"eval_weighted avg": { |
|
"f1-score": 0.8807489883812781, |
|
"precision": 0.8826802296805741, |
|
"recall": 0.8859114627167144, |
|
"support": 29705.0 |
|
}, |
|
"step": 162 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_Claim": { |
|
"f1-score": 0.64760736196319, |
|
"precision": 0.6627322953289804, |
|
"recall": 0.6331573896353166, |
|
"support": 4168.0 |
|
}, |
|
"eval_MajorClaim": { |
|
"f1-score": 0.9016018306636155, |
|
"precision": 0.8881875563570785, |
|
"recall": 0.9154275092936803, |
|
"support": 2152.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9996904982977407, |
|
"precision": 1.0, |
|
"recall": 0.9993811881188119, |
|
"support": 11312.0 |
|
}, |
|
"eval_Premise": { |
|
"f1-score": 0.8982820417748115, |
|
"precision": 0.8936065573770492, |
|
"recall": 0.9030067091857865, |
|
"support": 12073.0 |
|
}, |
|
"eval_accuracy": 0.9027436458508669, |
|
"eval_loss": 0.22585685551166534, |
|
"eval_macro avg": { |
|
"f1-score": 0.8617954331748394, |
|
"precision": 0.861131602265777, |
|
"recall": 0.8627431990583988, |
|
"support": 29705.0 |
|
}, |
|
"eval_runtime": 4.8003, |
|
"eval_samples_per_second": 16.666, |
|
"eval_steps_per_second": 2.083, |
|
"eval_weighted avg": { |
|
"f1-score": 0.9019670975035187, |
|
"precision": 0.9013351218793044, |
|
"recall": 0.9027436458508669, |
|
"support": 29705.0 |
|
}, |
|
"step": 243 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_Claim": { |
|
"f1-score": 0.6477602966229081, |
|
"precision": 0.5561865427637239, |
|
"recall": 0.7754318618042226, |
|
"support": 4168.0 |
|
}, |
|
"eval_MajorClaim": { |
|
"f1-score": 0.8984409799554566, |
|
"precision": 0.8627031650983746, |
|
"recall": 0.9372676579925651, |
|
"support": 2152.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 1.0, |
|
"precision": 1.0, |
|
"recall": 1.0, |
|
"support": 11312.0 |
|
}, |
|
"eval_Premise": { |
|
"f1-score": 0.861495720750997, |
|
"precision": 0.9384029675907849, |
|
"recall": 0.7962395427814131, |
|
"support": 12073.0 |
|
}, |
|
"eval_accuracy": 0.8811311227066151, |
|
"eval_loss": 0.32341843843460083, |
|
"eval_macro avg": { |
|
"f1-score": 0.8519242493323405, |
|
"precision": 0.8393231688632209, |
|
"recall": 0.8772347656445502, |
|
"support": 29705.0 |
|
}, |
|
"eval_runtime": 4.7708, |
|
"eval_samples_per_second": 16.769, |
|
"eval_steps_per_second": 2.096, |
|
"eval_weighted avg": { |
|
"f1-score": 0.8869263673393438, |
|
"precision": 0.9027457246003854, |
|
"recall": 0.8811311227066151, |
|
"support": 29705.0 |
|
}, |
|
"step": 324 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_Claim": { |
|
"f1-score": 0.6188788236838649, |
|
"precision": 0.6833864888373442, |
|
"recall": 0.5654990403071017, |
|
"support": 4168.0 |
|
}, |
|
"eval_MajorClaim": { |
|
"f1-score": 0.909733679000707, |
|
"precision": 0.9230033476805356, |
|
"recall": 0.8968401486988847, |
|
"support": 2152.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9999558011049724, |
|
"precision": 0.9999116061168567, |
|
"recall": 1.0, |
|
"support": 11312.0 |
|
}, |
|
"eval_Premise": { |
|
"f1-score": 0.8978936810431294, |
|
"precision": 0.8706816059757236, |
|
"recall": 0.9268615919821088, |
|
"support": 12073.0 |
|
}, |
|
"eval_accuracy": 0.9018347079616226, |
|
"eval_loss": 0.3072384297847748, |
|
"eval_macro avg": { |
|
"f1-score": 0.8566154962081685, |
|
"precision": 0.8692457621526151, |
|
"recall": 0.8473001952470238, |
|
"support": 29705.0 |
|
}, |
|
"eval_runtime": 4.7922, |
|
"eval_samples_per_second": 16.694, |
|
"eval_steps_per_second": 2.087, |
|
"eval_weighted avg": { |
|
"f1-score": 0.8984684143294738, |
|
"precision": 0.8974043833368577, |
|
"recall": 0.9018347079616226, |
|
"support": 29705.0 |
|
}, |
|
"step": 405 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_Claim": { |
|
"f1-score": 0.620837537840565, |
|
"precision": 0.6545212765957447, |
|
"recall": 0.5904510556621881, |
|
"support": 4168.0 |
|
}, |
|
"eval_MajorClaim": { |
|
"f1-score": 0.8993613741466637, |
|
"precision": 0.8547509418166597, |
|
"recall": 0.9488847583643123, |
|
"support": 2152.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9999558011049724, |
|
"precision": 0.9999116061168567, |
|
"recall": 1.0, |
|
"support": 11312.0 |
|
}, |
|
"eval_Premise": { |
|
"f1-score": 0.8931567692054615, |
|
"precision": 0.8869558114841134, |
|
"recall": 0.8994450426571688, |
|
"support": 12073.0 |
|
}, |
|
"eval_accuracy": 0.8979633058407676, |
|
"eval_loss": 0.3634909987449646, |
|
"eval_macro avg": { |
|
"f1-score": 0.8533278705744156, |
|
"precision": 0.8490349090033436, |
|
"recall": 0.8596952141709173, |
|
"support": 29705.0 |
|
}, |
|
"eval_runtime": 4.7765, |
|
"eval_samples_per_second": 16.749, |
|
"eval_steps_per_second": 2.094, |
|
"eval_weighted avg": { |
|
"f1-score": 0.8960665959131486, |
|
"precision": 0.8950239457358053, |
|
"recall": 0.8979633058407676, |
|
"support": 29705.0 |
|
}, |
|
"step": 486 |
|
}, |
|
{ |
|
"epoch": 6.17, |
|
"grad_norm": 9.48759651184082, |
|
"learning_rate": 1.7530864197530865e-05, |
|
"loss": 0.214, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_Claim": { |
|
"f1-score": 0.6812872467222885, |
|
"precision": 0.6769303647560397, |
|
"recall": 0.685700575815739, |
|
"support": 4168.0 |
|
}, |
|
"eval_MajorClaim": { |
|
"f1-score": 0.9276377217553688, |
|
"precision": 0.9319887429643527, |
|
"recall": 0.9233271375464684, |
|
"support": 2152.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9999115983026874, |
|
"precision": 0.9999115983026874, |
|
"recall": 0.9999115983026874, |
|
"support": 11312.0 |
|
}, |
|
"eval_Premise": { |
|
"f1-score": 0.9017086927670869, |
|
"precision": 0.9029819752471135, |
|
"recall": 0.9004389961070156, |
|
"support": 12073.0 |
|
}, |
|
"eval_accuracy": 0.9098468271334792, |
|
"eval_loss": 0.3468942642211914, |
|
"eval_macro avg": { |
|
"f1-score": 0.8776363148868579, |
|
"precision": 0.8779531703175483, |
|
"recall": 0.8773445769429775, |
|
"support": 29705.0 |
|
}, |
|
"eval_runtime": 4.7913, |
|
"eval_samples_per_second": 16.697, |
|
"eval_steps_per_second": 2.087, |
|
"eval_weighted avg": { |
|
"f1-score": 0.9100559053806798, |
|
"precision": 0.910277290769933, |
|
"recall": 0.9098468271334792, |
|
"support": 29705.0 |
|
}, |
|
"step": 567 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_Claim": { |
|
"f1-score": 0.6928905033731187, |
|
"precision": 0.6105725260654838, |
|
"recall": 0.8008637236084453, |
|
"support": 4168.0 |
|
}, |
|
"eval_MajorClaim": { |
|
"f1-score": 0.9302433371958285, |
|
"precision": 0.9278779472954231, |
|
"recall": 0.9326208178438662, |
|
"support": 2152.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9999115904871364, |
|
"precision": 1.0, |
|
"recall": 0.9998231966053748, |
|
"support": 11312.0 |
|
}, |
|
"eval_Premise": { |
|
"f1-score": 0.8820387074174622, |
|
"precision": 0.9356247097073851, |
|
"recall": 0.8342582622380519, |
|
"support": 12073.0 |
|
}, |
|
"eval_accuracy": 0.8997475172529877, |
|
"eval_loss": 0.40174800157546997, |
|
"eval_macro avg": { |
|
"f1-score": 0.8762710346183864, |
|
"precision": 0.868518795767073, |
|
"recall": 0.8918915000739345, |
|
"support": 29705.0 |
|
}, |
|
"eval_runtime": 4.7722, |
|
"eval_samples_per_second": 16.764, |
|
"eval_steps_per_second": 2.095, |
|
"eval_weighted avg": { |
|
"f1-score": 0.9038782866839282, |
|
"precision": 0.9139692560686062, |
|
"recall": 0.8997475172529877, |
|
"support": 29705.0 |
|
}, |
|
"step": 648 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_Claim": { |
|
"f1-score": 0.6602241979126401, |
|
"precision": 0.7130531589201224, |
|
"recall": 0.6146833013435701, |
|
"support": 4168.0 |
|
}, |
|
"eval_MajorClaim": { |
|
"f1-score": 0.9052154195011338, |
|
"precision": 0.8839681133746679, |
|
"recall": 0.9275092936802974, |
|
"support": 2152.0 |
|
}, |
|
"eval_O": { |
|
"f1-score": 0.9999558011049724, |
|
"precision": 0.9999116061168567, |
|
"recall": 1.0, |
|
"support": 11312.0 |
|
}, |
|
"eval_Premise": { |
|
"f1-score": 0.9072885349800925, |
|
"precision": 0.8903596204449405, |
|
"recall": 0.9248736850824153, |
|
"support": 12073.0 |
|
}, |
|
"eval_accuracy": 0.910149806429894, |
|
"eval_loss": 0.4713464379310608, |
|
"eval_macro avg": { |
|
"f1-score": 0.8681709883747097, |
|
"precision": 0.8718231247141469, |
|
"recall": 0.8667665700265708, |
|
"support": 29705.0 |
|
}, |
|
"eval_runtime": 4.7731, |
|
"eval_samples_per_second": 16.761, |
|
"eval_steps_per_second": 2.095, |
|
"eval_weighted avg": { |
|
"f1-score": 0.9077607320175198, |
|
"precision": 0.9067368029754924, |
|
"recall": 0.910149806429894, |
|
"support": 29705.0 |
|
}, |
|
"step": 729 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 4050, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 50, |
|
"save_steps": 500, |
|
"total_flos": 1294098594541200.0, |
|
"train_batch_size": 4, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|