LessSexistBERT-edos / trainer_state.json
clincolnoz's picture
correct weights
8fa6cc5
raw
history blame
No virus
3.96 kB
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 3.0,
"global_step": 3000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.5,
"learning_rate": 1.6686666666666667e-05,
"loss": 0.4418,
"step": 500
},
{
"epoch": 1.0,
"learning_rate": 1.3353333333333333e-05,
"loss": 0.3253,
"step": 1000
},
{
"epoch": 1.0,
"eval_accuracy": 0.878,
"eval_classification_report": " precision recall f1-score support\n0 0.901961 0.941254 0.921189 3030.000\n1 0.787589 0.680412 0.730088 970.000\naccuracy 0.878000 0.878000 0.878000 0.878\nmacro avg 0.844775 0.810833 0.825639 4000.000\nweighted avg 0.874226 0.878000 0.874847 4000.000",
"eval_confusion_matrix": "[[2852 178]\n [ 310 660]]",
"eval_confusion_matrix_norm": "[[0.94125413 0.05874587]\n [0.31958763 0.68041237]]",
"eval_f1": 0.7300884955752213,
"eval_f1_macro": 0.8256385630330887,
"eval_f1_weighted": 0.8748468477738904,
"eval_loss": 0.3010723888874054,
"eval_runtime": 9.6596,
"eval_samples_per_second": 414.097,
"eval_steps_per_second": 25.881,
"step": 1000
},
{
"epoch": 1.5,
"learning_rate": 1.002e-05,
"loss": 0.2684,
"step": 1500
},
{
"epoch": 2.0,
"learning_rate": 6.6866666666666665e-06,
"loss": 0.2439,
"step": 2000
},
{
"epoch": 2.0,
"eval_accuracy": 0.8865,
"eval_classification_report": " precision recall f1-score support\n0 0.914414 0.937954 0.926035 3030.0000\n1 0.789238 0.725773 0.756176 970.0000\naccuracy 0.886500 0.886500 0.886500 0.8865\nmacro avg 0.851826 0.831863 0.841105 4000.0000\nweighted avg 0.884059 0.886500 0.884844 4000.0000",
"eval_confusion_matrix": "[[2842 188]\n [ 266 704]]",
"eval_confusion_matrix_norm": "[[0.9379538 0.0620462]\n [0.2742268 0.7257732]]",
"eval_f1": 0.7561761546723953,
"eval_f1_macro": 0.84110534680508,
"eval_f1_weighted": 0.8848438807534127,
"eval_loss": 0.3121766746044159,
"eval_runtime": 9.6642,
"eval_samples_per_second": 413.897,
"eval_steps_per_second": 25.869,
"step": 2000
},
{
"epoch": 2.5,
"learning_rate": 3.3600000000000004e-06,
"loss": 0.2023,
"step": 2500
},
{
"epoch": 3.0,
"learning_rate": 2.6666666666666667e-08,
"loss": 0.1962,
"step": 3000
},
{
"epoch": 3.0,
"eval_accuracy": 0.88075,
"eval_classification_report": " precision recall f1-score support\n0 0.920593 0.922112 0.921352 3030.00000\n1 0.755440 0.751546 0.753488 970.00000\naccuracy 0.880750 0.880750 0.880750 0.88075\nmacro avg 0.838017 0.836829 0.837420 4000.00000\nweighted avg 0.880544 0.880750 0.880645 4000.00000",
"eval_confusion_matrix": "[[2794 236]\n [ 241 729]]",
"eval_confusion_matrix_norm": "[[0.92211221 0.07788779]\n [0.24845361 0.75154639]]",
"eval_f1": 0.7534883720930233,
"eval_f1_macro": 0.8374201959393394,
"eval_f1_weighted": 0.8806450852201921,
"eval_loss": 0.3457934856414795,
"eval_runtime": 9.6651,
"eval_samples_per_second": 413.86,
"eval_steps_per_second": 25.866,
"step": 3000
},
{
"epoch": 3.0,
"step": 3000,
"total_flos": 1.262933065728e+16,
"train_loss": 0.27966182454427085,
"train_runtime": 430.7509,
"train_samples_per_second": 111.433,
"train_steps_per_second": 6.965
}
],
"max_steps": 3000,
"num_train_epochs": 3,
"total_flos": 1.262933065728e+16,
"trial_name": null,
"trial_params": null
}