|
{ |
|
"best_metric": 0.09445525705814362, |
|
"best_model_checkpoint": "/kaggle/working/checkpoint-48000", |
|
"epoch": 1.9991670137442732, |
|
"global_step": 48000, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.25, |
|
"learning_rate": 1.750104123281966e-05, |
|
"loss": 0.0319, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 0.25, |
|
"eval_accuracy": 0.9821939782823297, |
|
"eval_f1": 0.9897475612268823, |
|
"eval_loss": 0.16341181099414825, |
|
"eval_precision": 0.9992109831150386, |
|
"eval_recall": 0.9804617117117117, |
|
"eval_runtime": 789.0185, |
|
"eval_samples_per_second": 102.71, |
|
"eval_steps_per_second": 12.839, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"learning_rate": 1.5002082465639318e-05, |
|
"loss": 0.0147, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"eval_accuracy": 0.9766658440276407, |
|
"eval_f1": 0.9865158764680296, |
|
"eval_loss": 0.10613188147544861, |
|
"eval_precision": 0.999638723102935, |
|
"eval_recall": 0.9737331081081081, |
|
"eval_runtime": 793.5025, |
|
"eval_samples_per_second": 102.129, |
|
"eval_steps_per_second": 12.766, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 0.75, |
|
"learning_rate": 1.2503123698458976e-05, |
|
"loss": 0.0107, |
|
"step": 18000 |
|
}, |
|
{ |
|
"epoch": 0.75, |
|
"eval_accuracy": 0.9957428430404739, |
|
"eval_f1": 0.9975677676336846, |
|
"eval_loss": 0.043012455105781555, |
|
"eval_precision": 0.9992232186992444, |
|
"eval_recall": 0.9959177927927928, |
|
"eval_runtime": 792.2966, |
|
"eval_samples_per_second": 102.285, |
|
"eval_steps_per_second": 12.786, |
|
"step": 18000 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 1.0004164931278636e-05, |
|
"loss": 0.0074, |
|
"step": 24000 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.9847235932872656, |
|
"eval_f1": 0.9912112564069798, |
|
"eval_loss": 0.09504717588424683, |
|
"eval_precision": 0.9998567786657501, |
|
"eval_recall": 0.9827139639639639, |
|
"eval_runtime": 790.115, |
|
"eval_samples_per_second": 102.567, |
|
"eval_steps_per_second": 12.821, |
|
"step": 24000 |
|
}, |
|
{ |
|
"epoch": 1.25, |
|
"learning_rate": 7.505206164098294e-06, |
|
"loss": 0.0041, |
|
"step": 30000 |
|
}, |
|
{ |
|
"epoch": 1.25, |
|
"eval_accuracy": 0.9903998025666337, |
|
"eval_f1": 0.9944949973819397, |
|
"eval_loss": 0.08727405965328217, |
|
"eval_precision": 0.9998292689867114, |
|
"eval_recall": 0.9892173423423424, |
|
"eval_runtime": 788.7991, |
|
"eval_samples_per_second": 102.738, |
|
"eval_steps_per_second": 12.842, |
|
"step": 30000 |
|
}, |
|
{ |
|
"epoch": 1.5, |
|
"learning_rate": 5.006247396917952e-06, |
|
"loss": 0.0031, |
|
"step": 36000 |
|
}, |
|
{ |
|
"epoch": 1.5, |
|
"eval_accuracy": 0.9819718657453109, |
|
"eval_f1": 0.9896102233695304, |
|
"eval_loss": 0.1629093438386917, |
|
"eval_precision": 1.0, |
|
"eval_recall": 0.9794341216216216, |
|
"eval_runtime": 788.9221, |
|
"eval_samples_per_second": 102.722, |
|
"eval_steps_per_second": 12.84, |
|
"step": 36000 |
|
}, |
|
{ |
|
"epoch": 1.75, |
|
"learning_rate": 2.5072886297376097e-06, |
|
"loss": 0.0022, |
|
"step": 42000 |
|
}, |
|
{ |
|
"epoch": 1.75, |
|
"eval_accuracy": 0.9804540967423495, |
|
"eval_f1": 0.9887258181611126, |
|
"eval_loss": 0.1487206518650055, |
|
"eval_precision": 0.9999856028103314, |
|
"eval_recall": 0.9777167792792792, |
|
"eval_runtime": 791.8683, |
|
"eval_samples_per_second": 102.34, |
|
"eval_steps_per_second": 12.793, |
|
"step": 42000 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 8.329862557267807e-09, |
|
"loss": 0.001, |
|
"step": 48000 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.9904368213228035, |
|
"eval_f1": 0.9945157204220418, |
|
"eval_loss": 0.09445525705814362, |
|
"eval_precision": 0.9999430791342336, |
|
"eval_recall": 0.9891469594594594, |
|
"eval_runtime": 792.2508, |
|
"eval_samples_per_second": 102.291, |
|
"eval_steps_per_second": 12.786, |
|
"step": 48000 |
|
} |
|
], |
|
"max_steps": 48020, |
|
"num_train_epochs": 2, |
|
"total_flos": 7.687934370520642e+16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|