|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 3.0, |
|
"global_step": 3000, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.5, |
|
"learning_rate": 1.6686666666666667e-05, |
|
"loss": 0.4418, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 1.3353333333333333e-05, |
|
"loss": 0.3253, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.878, |
|
"eval_classification_report": " precision recall f1-score support\n0 0.901961 0.941254 0.921189 3030.000\n1 0.787589 0.680412 0.730088 970.000\naccuracy 0.878000 0.878000 0.878000 0.878\nmacro avg 0.844775 0.810833 0.825639 4000.000\nweighted avg 0.874226 0.878000 0.874847 4000.000", |
|
"eval_confusion_matrix": "[[2852 178]\n [ 310 660]]", |
|
"eval_confusion_matrix_norm": "[[0.94125413 0.05874587]\n [0.31958763 0.68041237]]", |
|
"eval_f1": 0.7300884955752213, |
|
"eval_f1_macro": 0.8256385630330887, |
|
"eval_f1_weighted": 0.8748468477738904, |
|
"eval_loss": 0.3010723888874054, |
|
"eval_runtime": 9.6596, |
|
"eval_samples_per_second": 414.097, |
|
"eval_steps_per_second": 25.881, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 1.5, |
|
"learning_rate": 1.002e-05, |
|
"loss": 0.2684, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 6.6866666666666665e-06, |
|
"loss": 0.2439, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.8865, |
|
"eval_classification_report": " precision recall f1-score support\n0 0.914414 0.937954 0.926035 3030.0000\n1 0.789238 0.725773 0.756176 970.0000\naccuracy 0.886500 0.886500 0.886500 0.8865\nmacro avg 0.851826 0.831863 0.841105 4000.0000\nweighted avg 0.884059 0.886500 0.884844 4000.0000", |
|
"eval_confusion_matrix": "[[2842 188]\n [ 266 704]]", |
|
"eval_confusion_matrix_norm": "[[0.9379538 0.0620462]\n [0.2742268 0.7257732]]", |
|
"eval_f1": 0.7561761546723953, |
|
"eval_f1_macro": 0.84110534680508, |
|
"eval_f1_weighted": 0.8848438807534127, |
|
"eval_loss": 0.3121766746044159, |
|
"eval_runtime": 9.6642, |
|
"eval_samples_per_second": 413.897, |
|
"eval_steps_per_second": 25.869, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 2.5, |
|
"learning_rate": 3.3600000000000004e-06, |
|
"loss": 0.2023, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"learning_rate": 2.6666666666666667e-08, |
|
"loss": 0.1962, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.88075, |
|
"eval_classification_report": " precision recall f1-score support\n0 0.920593 0.922112 0.921352 3030.00000\n1 0.755440 0.751546 0.753488 970.00000\naccuracy 0.880750 0.880750 0.880750 0.88075\nmacro avg 0.838017 0.836829 0.837420 4000.00000\nweighted avg 0.880544 0.880750 0.880645 4000.00000", |
|
"eval_confusion_matrix": "[[2794 236]\n [ 241 729]]", |
|
"eval_confusion_matrix_norm": "[[0.92211221 0.07788779]\n [0.24845361 0.75154639]]", |
|
"eval_f1": 0.7534883720930233, |
|
"eval_f1_macro": 0.8374201959393394, |
|
"eval_f1_weighted": 0.8806450852201921, |
|
"eval_loss": 0.3457934856414795, |
|
"eval_runtime": 9.6651, |
|
"eval_samples_per_second": 413.86, |
|
"eval_steps_per_second": 25.866, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"step": 3000, |
|
"total_flos": 1.262933065728e+16, |
|
"train_loss": 0.27966182454427085, |
|
"train_runtime": 430.7509, |
|
"train_samples_per_second": 111.433, |
|
"train_steps_per_second": 6.965 |
|
} |
|
], |
|
"max_steps": 3000, |
|
"num_train_epochs": 3, |
|
"total_flos": 1.262933065728e+16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|