longformer-sep_tok / checkpoint-648 /trainer_state.json
Theoreticallyhugo's picture
Training in progress, epoch 8, checkpoint
608fc35 verified
raw
history blame
11 kB
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 8.0,
"eval_steps": 500,
"global_step": 648,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_Claim": {
"f1-score": 0.5254768748366867,
"precision": 0.5768789443488239,
"recall": 0.4824856046065259,
"support": 4168.0
},
"eval_MajorClaim": {
"f1-score": 0.7984361424847959,
"precision": 0.7495921696574225,
"recall": 0.854089219330855,
"support": 2152.0
},
"eval_O": {
"f1-score": 0.9990277532260916,
"precision": 0.9988511841640155,
"recall": 0.9992043847241867,
"support": 11312.0
},
"eval_Premise": {
"f1-score": 0.8854183656825966,
"precision": 0.8719781543651113,
"recall": 0.8992793837488611,
"support": 12073.0
},
"eval_accuracy": 0.8755765022723447,
"eval_loss": 0.28303390741348267,
"eval_macro avg": {
"f1-score": 0.8020897840575427,
"precision": 0.7993251131338432,
"recall": 0.8087646481026072,
"support": 29705.0
},
"eval_runtime": 4.8106,
"eval_samples_per_second": 16.63,
"eval_steps_per_second": 2.079,
"eval_weighted avg": {
"f1-score": 0.8718761173649596,
"precision": 0.8700202202343714,
"recall": 0.8755765022723447,
"support": 29705.0
},
"step": 81
},
{
"epoch": 2.0,
"eval_Claim": {
"f1-score": 0.5578782336033447,
"precision": 0.6124497991967871,
"recall": 0.5122360844529751,
"support": 4168.0
},
"eval_MajorClaim": {
"f1-score": 0.784421283598464,
"precision": 0.9571619812583668,
"recall": 0.6644981412639405,
"support": 2152.0
},
"eval_O": {
"f1-score": 0.9998674150351351,
"precision": 0.9997348652231551,
"recall": 1.0,
"support": 11312.0
},
"eval_Premise": {
"f1-score": 0.8977749872463995,
"precision": 0.8530201342281879,
"recall": 0.9474861260664292,
"support": 12073.0
},
"eval_accuracy": 0.8859114627167144,
"eval_loss": 0.27363118529319763,
"eval_macro avg": {
"f1-score": 0.8099854798708358,
"precision": 0.8555916949766242,
"recall": 0.7810550879458362,
"support": 29705.0
},
"eval_runtime": 4.7727,
"eval_samples_per_second": 16.762,
"eval_steps_per_second": 2.095,
"eval_weighted avg": {
"f1-score": 0.8807489883812781,
"precision": 0.8826802296805741,
"recall": 0.8859114627167144,
"support": 29705.0
},
"step": 162
},
{
"epoch": 3.0,
"eval_Claim": {
"f1-score": 0.64760736196319,
"precision": 0.6627322953289804,
"recall": 0.6331573896353166,
"support": 4168.0
},
"eval_MajorClaim": {
"f1-score": 0.9016018306636155,
"precision": 0.8881875563570785,
"recall": 0.9154275092936803,
"support": 2152.0
},
"eval_O": {
"f1-score": 0.9996904982977407,
"precision": 1.0,
"recall": 0.9993811881188119,
"support": 11312.0
},
"eval_Premise": {
"f1-score": 0.8982820417748115,
"precision": 0.8936065573770492,
"recall": 0.9030067091857865,
"support": 12073.0
},
"eval_accuracy": 0.9027436458508669,
"eval_loss": 0.22585685551166534,
"eval_macro avg": {
"f1-score": 0.8617954331748394,
"precision": 0.861131602265777,
"recall": 0.8627431990583988,
"support": 29705.0
},
"eval_runtime": 4.8003,
"eval_samples_per_second": 16.666,
"eval_steps_per_second": 2.083,
"eval_weighted avg": {
"f1-score": 0.9019670975035187,
"precision": 0.9013351218793044,
"recall": 0.9027436458508669,
"support": 29705.0
},
"step": 243
},
{
"epoch": 4.0,
"eval_Claim": {
"f1-score": 0.6477602966229081,
"precision": 0.5561865427637239,
"recall": 0.7754318618042226,
"support": 4168.0
},
"eval_MajorClaim": {
"f1-score": 0.8984409799554566,
"precision": 0.8627031650983746,
"recall": 0.9372676579925651,
"support": 2152.0
},
"eval_O": {
"f1-score": 1.0,
"precision": 1.0,
"recall": 1.0,
"support": 11312.0
},
"eval_Premise": {
"f1-score": 0.861495720750997,
"precision": 0.9384029675907849,
"recall": 0.7962395427814131,
"support": 12073.0
},
"eval_accuracy": 0.8811311227066151,
"eval_loss": 0.32341843843460083,
"eval_macro avg": {
"f1-score": 0.8519242493323405,
"precision": 0.8393231688632209,
"recall": 0.8772347656445502,
"support": 29705.0
},
"eval_runtime": 4.7708,
"eval_samples_per_second": 16.769,
"eval_steps_per_second": 2.096,
"eval_weighted avg": {
"f1-score": 0.8869263673393438,
"precision": 0.9027457246003854,
"recall": 0.8811311227066151,
"support": 29705.0
},
"step": 324
},
{
"epoch": 5.0,
"eval_Claim": {
"f1-score": 0.6188788236838649,
"precision": 0.6833864888373442,
"recall": 0.5654990403071017,
"support": 4168.0
},
"eval_MajorClaim": {
"f1-score": 0.909733679000707,
"precision": 0.9230033476805356,
"recall": 0.8968401486988847,
"support": 2152.0
},
"eval_O": {
"f1-score": 0.9999558011049724,
"precision": 0.9999116061168567,
"recall": 1.0,
"support": 11312.0
},
"eval_Premise": {
"f1-score": 0.8978936810431294,
"precision": 0.8706816059757236,
"recall": 0.9268615919821088,
"support": 12073.0
},
"eval_accuracy": 0.9018347079616226,
"eval_loss": 0.3072384297847748,
"eval_macro avg": {
"f1-score": 0.8566154962081685,
"precision": 0.8692457621526151,
"recall": 0.8473001952470238,
"support": 29705.0
},
"eval_runtime": 4.7922,
"eval_samples_per_second": 16.694,
"eval_steps_per_second": 2.087,
"eval_weighted avg": {
"f1-score": 0.8984684143294738,
"precision": 0.8974043833368577,
"recall": 0.9018347079616226,
"support": 29705.0
},
"step": 405
},
{
"epoch": 6.0,
"eval_Claim": {
"f1-score": 0.620837537840565,
"precision": 0.6545212765957447,
"recall": 0.5904510556621881,
"support": 4168.0
},
"eval_MajorClaim": {
"f1-score": 0.8993613741466637,
"precision": 0.8547509418166597,
"recall": 0.9488847583643123,
"support": 2152.0
},
"eval_O": {
"f1-score": 0.9999558011049724,
"precision": 0.9999116061168567,
"recall": 1.0,
"support": 11312.0
},
"eval_Premise": {
"f1-score": 0.8931567692054615,
"precision": 0.8869558114841134,
"recall": 0.8994450426571688,
"support": 12073.0
},
"eval_accuracy": 0.8979633058407676,
"eval_loss": 0.3634909987449646,
"eval_macro avg": {
"f1-score": 0.8533278705744156,
"precision": 0.8490349090033436,
"recall": 0.8596952141709173,
"support": 29705.0
},
"eval_runtime": 4.7765,
"eval_samples_per_second": 16.749,
"eval_steps_per_second": 2.094,
"eval_weighted avg": {
"f1-score": 0.8960665959131486,
"precision": 0.8950239457358053,
"recall": 0.8979633058407676,
"support": 29705.0
},
"step": 486
},
{
"epoch": 6.17,
"grad_norm": 9.48759651184082,
"learning_rate": 1.7530864197530865e-05,
"loss": 0.214,
"step": 500
},
{
"epoch": 7.0,
"eval_Claim": {
"f1-score": 0.6812872467222885,
"precision": 0.6769303647560397,
"recall": 0.685700575815739,
"support": 4168.0
},
"eval_MajorClaim": {
"f1-score": 0.9276377217553688,
"precision": 0.9319887429643527,
"recall": 0.9233271375464684,
"support": 2152.0
},
"eval_O": {
"f1-score": 0.9999115983026874,
"precision": 0.9999115983026874,
"recall": 0.9999115983026874,
"support": 11312.0
},
"eval_Premise": {
"f1-score": 0.9017086927670869,
"precision": 0.9029819752471135,
"recall": 0.9004389961070156,
"support": 12073.0
},
"eval_accuracy": 0.9098468271334792,
"eval_loss": 0.3468942642211914,
"eval_macro avg": {
"f1-score": 0.8776363148868579,
"precision": 0.8779531703175483,
"recall": 0.8773445769429775,
"support": 29705.0
},
"eval_runtime": 4.7913,
"eval_samples_per_second": 16.697,
"eval_steps_per_second": 2.087,
"eval_weighted avg": {
"f1-score": 0.9100559053806798,
"precision": 0.910277290769933,
"recall": 0.9098468271334792,
"support": 29705.0
},
"step": 567
},
{
"epoch": 8.0,
"eval_Claim": {
"f1-score": 0.6928905033731187,
"precision": 0.6105725260654838,
"recall": 0.8008637236084453,
"support": 4168.0
},
"eval_MajorClaim": {
"f1-score": 0.9302433371958285,
"precision": 0.9278779472954231,
"recall": 0.9326208178438662,
"support": 2152.0
},
"eval_O": {
"f1-score": 0.9999115904871364,
"precision": 1.0,
"recall": 0.9998231966053748,
"support": 11312.0
},
"eval_Premise": {
"f1-score": 0.8820387074174622,
"precision": 0.9356247097073851,
"recall": 0.8342582622380519,
"support": 12073.0
},
"eval_accuracy": 0.8997475172529877,
"eval_loss": 0.40174800157546997,
"eval_macro avg": {
"f1-score": 0.8762710346183864,
"precision": 0.868518795767073,
"recall": 0.8918915000739345,
"support": 29705.0
},
"eval_runtime": 4.7722,
"eval_samples_per_second": 16.764,
"eval_steps_per_second": 2.095,
"eval_weighted avg": {
"f1-score": 0.9038782866839282,
"precision": 0.9139692560686062,
"recall": 0.8997475172529877,
"support": 29705.0
},
"step": 648
}
],
"logging_steps": 500,
"max_steps": 4050,
"num_input_tokens_seen": 0,
"num_train_epochs": 50,
"save_steps": 500,
"total_flos": 1150309861814400.0,
"train_batch_size": 4,
"trial_name": null,
"trial_params": null
}