longformer-sep_tok / checkpoint-41 /trainer_state.json
Theoreticallyhugo's picture
Training in progress, epoch 1, checkpoint
c432439 verified
raw
history blame
1.77 kB
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 1.0,
"eval_steps": 500,
"global_step": 41,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_Claim": {
"f1-score": 0.4643135219309629,
"precision": 0.5337112171837709,
"recall": 0.4108865411116215,
"support": 4354.0
},
"eval_MajorClaim": {
"f1-score": 0.7490950657268052,
"precision": 0.6779310344827586,
"recall": 0.8369518944231588,
"support": 2349.0
},
"eval_O": {
"f1-score": 0.9980494407069782,
"precision": 0.9961064759634486,
"recall": 1.0,
"support": 12536.0
},
"eval_Premise": {
"f1-score": 0.8811786372007365,
"precision": 0.868321718931475,
"recall": 0.8944220128607746,
"support": 13374.0
},
"eval_accuracy": 0.8663109802839358,
"eval_loss": 0.32735684514045715,
"eval_macro avg": {
"f1-score": 0.7731591663913707,
"precision": 0.7690176116403633,
"recall": 0.7855651120988888,
"support": 32613.0
},
"eval_runtime": 1.4205,
"eval_samples_per_second": 57.022,
"eval_steps_per_second": 7.744,
"eval_weighted avg": {
"f1-score": 0.8609350954068932,
"precision": 0.8590551035257559,
"recall": 0.8663109802839358,
"support": 32613.0
},
"step": 41
}
],
"logging_steps": 500,
"max_steps": 656,
"num_input_tokens_seen": 0,
"num_train_epochs": 16,
"save_steps": 500,
"total_flos": 143342183867400.0,
"train_batch_size": 8,
"trial_name": null,
"trial_params": null
}