|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 13.157894736842104, |
|
"global_step": 500, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.32, |
|
"eval_accuracy": 0.7606798346348186, |
|
"eval_f1": 0.7277096851718338, |
|
"eval_loss": 0.9062727689743042, |
|
"eval_precision": 0.7006015733456733, |
|
"eval_recall": 0.757, |
|
"eval_runtime": 3.59, |
|
"eval_samples_per_second": 15.042, |
|
"eval_steps_per_second": 1.114, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 2.63, |
|
"eval_accuracy": 0.7967386311437759, |
|
"eval_f1": 0.8242074927953891, |
|
"eval_loss": 0.6386759281158447, |
|
"eval_precision": 0.7929759704251387, |
|
"eval_recall": 0.858, |
|
"eval_runtime": 3.6147, |
|
"eval_samples_per_second": 14.939, |
|
"eval_steps_per_second": 1.107, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 3.95, |
|
"eval_accuracy": 0.825447864033073, |
|
"eval_f1": 0.8485576923076923, |
|
"eval_loss": 0.5691221356391907, |
|
"eval_precision": 0.8171296296296297, |
|
"eval_recall": 0.8825, |
|
"eval_runtime": 3.5957, |
|
"eval_samples_per_second": 15.018, |
|
"eval_steps_per_second": 1.112, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 5.26, |
|
"eval_accuracy": 0.822347266881029, |
|
"eval_f1": 0.8555474629764507, |
|
"eval_loss": 0.5723332166671753, |
|
"eval_precision": 0.831524303916942, |
|
"eval_recall": 0.881, |
|
"eval_runtime": 3.6337, |
|
"eval_samples_per_second": 14.861, |
|
"eval_steps_per_second": 1.101, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 6.58, |
|
"eval_accuracy": 0.8292374827744603, |
|
"eval_f1": 0.8729388942774006, |
|
"eval_loss": 0.5896942019462585, |
|
"eval_precision": 0.847457627118644, |
|
"eval_recall": 0.9, |
|
"eval_runtime": 3.5978, |
|
"eval_samples_per_second": 15.009, |
|
"eval_steps_per_second": 1.112, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 7.89, |
|
"eval_accuracy": 0.8283187873220027, |
|
"eval_f1": 0.874515503875969, |
|
"eval_loss": 0.6122345924377441, |
|
"eval_precision": 0.8482142857142857, |
|
"eval_recall": 0.9025, |
|
"eval_runtime": 3.5423, |
|
"eval_samples_per_second": 15.244, |
|
"eval_steps_per_second": 1.129, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 9.21, |
|
"eval_accuracy": 0.8392282958199357, |
|
"eval_f1": 0.8740884783665532, |
|
"eval_loss": 0.6045289635658264, |
|
"eval_precision": 0.8505203405865658, |
|
"eval_recall": 0.899, |
|
"eval_runtime": 3.5491, |
|
"eval_samples_per_second": 15.215, |
|
"eval_steps_per_second": 1.127, |
|
"step": 350 |
|
}, |
|
{ |
|
"epoch": 10.53, |
|
"eval_accuracy": 0.8446256316031235, |
|
"eval_f1": 0.8851733464470125, |
|
"eval_loss": 0.5662067532539368, |
|
"eval_precision": 0.8708272859216255, |
|
"eval_recall": 0.9, |
|
"eval_runtime": 3.6229, |
|
"eval_samples_per_second": 14.905, |
|
"eval_steps_per_second": 1.104, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 11.84, |
|
"eval_accuracy": 0.843706936150666, |
|
"eval_f1": 0.888943488943489, |
|
"eval_loss": 0.5973214507102966, |
|
"eval_precision": 0.8739130434782608, |
|
"eval_recall": 0.9045, |
|
"eval_runtime": 3.6244, |
|
"eval_samples_per_second": 14.899, |
|
"eval_steps_per_second": 1.104, |
|
"step": 450 |
|
}, |
|
{ |
|
"epoch": 13.16, |
|
"learning_rate": 0.0, |
|
"loss": 0.4305, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 13.16, |
|
"eval_accuracy": 0.843706936150666, |
|
"eval_f1": 0.8903638151425762, |
|
"eval_loss": 0.6187416911125183, |
|
"eval_precision": 0.875725338491296, |
|
"eval_recall": 0.9055, |
|
"eval_runtime": 3.6234, |
|
"eval_samples_per_second": 14.903, |
|
"eval_steps_per_second": 1.104, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 13.16, |
|
"step": 500, |
|
"total_flos": 520356947539968.0, |
|
"train_loss": 0.43045907592773436, |
|
"train_runtime": 334.1747, |
|
"train_samples_per_second": 5.985, |
|
"train_steps_per_second": 1.496 |
|
} |
|
], |
|
"max_steps": 500, |
|
"num_train_epochs": 14, |
|
"total_flos": 520356947539968.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|