|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 10.0, |
|
"global_step": 910, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.9533894011551323, |
|
"eval_f1": 0.6969990319457888, |
|
"eval_loss": 0.20486080646514893, |
|
"eval_precision": 0.6617647058823529, |
|
"eval_recall": 0.7361963190184049, |
|
"eval_runtime": 1.2373, |
|
"eval_samples_per_second": 130.123, |
|
"eval_steps_per_second": 33.137, |
|
"step": 91 |
|
}, |
|
{ |
|
"epoch": 1.1, |
|
"learning_rate": 4.4505494505494504e-05, |
|
"loss": 0.5036, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.9722362954706657, |
|
"eval_f1": 0.8234146341463414, |
|
"eval_loss": 0.11564752459526062, |
|
"eval_precision": 0.7873134328358209, |
|
"eval_recall": 0.8629856850715747, |
|
"eval_runtime": 1.2367, |
|
"eval_samples_per_second": 130.181, |
|
"eval_steps_per_second": 33.152, |
|
"step": 182 |
|
}, |
|
{ |
|
"epoch": 2.2, |
|
"learning_rate": 3.901098901098901e-05, |
|
"loss": 0.1442, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.9771000101327388, |
|
"eval_f1": 0.8632812499999999, |
|
"eval_loss": 0.10779214650392532, |
|
"eval_precision": 0.8261682242990654, |
|
"eval_recall": 0.9038854805725971, |
|
"eval_runtime": 1.2508, |
|
"eval_samples_per_second": 128.715, |
|
"eval_steps_per_second": 32.778, |
|
"step": 273 |
|
}, |
|
{ |
|
"epoch": 3.3, |
|
"learning_rate": 3.3516483516483513e-05, |
|
"loss": 0.0757, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.9780119566318776, |
|
"eval_f1": 0.8851148851148851, |
|
"eval_loss": 0.1178947389125824, |
|
"eval_precision": 0.865234375, |
|
"eval_recall": 0.9059304703476483, |
|
"eval_runtime": 1.2453, |
|
"eval_samples_per_second": 129.288, |
|
"eval_steps_per_second": 32.924, |
|
"step": 364 |
|
}, |
|
{ |
|
"epoch": 4.4, |
|
"learning_rate": 2.8021978021978025e-05, |
|
"loss": 0.0526, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.9836862904042962, |
|
"eval_f1": 0.897876643073812, |
|
"eval_loss": 0.0906740128993988, |
|
"eval_precision": 0.888, |
|
"eval_recall": 0.9079754601226994, |
|
"eval_runtime": 1.2584, |
|
"eval_samples_per_second": 127.94, |
|
"eval_steps_per_second": 32.581, |
|
"step": 455 |
|
}, |
|
{ |
|
"epoch": 5.49, |
|
"learning_rate": 2.252747252747253e-05, |
|
"loss": 0.0342, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.9831796534603303, |
|
"eval_f1": 0.9130869130869131, |
|
"eval_loss": 0.0972292423248291, |
|
"eval_precision": 0.892578125, |
|
"eval_recall": 0.934560327198364, |
|
"eval_runtime": 1.2748, |
|
"eval_samples_per_second": 126.296, |
|
"eval_steps_per_second": 32.162, |
|
"step": 546 |
|
}, |
|
{ |
|
"epoch": 6.59, |
|
"learning_rate": 1.7032967032967035e-05, |
|
"loss": 0.0245, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.9833823082379167, |
|
"eval_f1": 0.9107321965897693, |
|
"eval_loss": 0.10643576085567474, |
|
"eval_precision": 0.8937007874015748, |
|
"eval_recall": 0.9284253578732107, |
|
"eval_runtime": 1.2478, |
|
"eval_samples_per_second": 129.031, |
|
"eval_steps_per_second": 32.859, |
|
"step": 637 |
|
}, |
|
{ |
|
"epoch": 7.69, |
|
"learning_rate": 1.153846153846154e-05, |
|
"loss": 0.0188, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.9850035464586078, |
|
"eval_f1": 0.9169169169169169, |
|
"eval_loss": 0.09653466939926147, |
|
"eval_precision": 0.8980392156862745, |
|
"eval_recall": 0.9366053169734151, |
|
"eval_runtime": 1.2451, |
|
"eval_samples_per_second": 129.306, |
|
"eval_steps_per_second": 32.929, |
|
"step": 728 |
|
}, |
|
{ |
|
"epoch": 8.79, |
|
"learning_rate": 6.043956043956044e-06, |
|
"loss": 0.0159, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.984598236903435, |
|
"eval_f1": 0.9201213346814965, |
|
"eval_loss": 0.09986742585897446, |
|
"eval_precision": 0.91, |
|
"eval_recall": 0.9304703476482618, |
|
"eval_runtime": 1.2461, |
|
"eval_samples_per_second": 129.208, |
|
"eval_steps_per_second": 32.904, |
|
"step": 819 |
|
}, |
|
{ |
|
"epoch": 9.89, |
|
"learning_rate": 5.494505494505495e-07, |
|
"loss": 0.0141, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.985104873847401, |
|
"eval_f1": 0.911088911088911, |
|
"eval_loss": 0.09563781321048737, |
|
"eval_precision": 0.890625, |
|
"eval_recall": 0.9325153374233128, |
|
"eval_runtime": 1.2493, |
|
"eval_samples_per_second": 128.877, |
|
"eval_steps_per_second": 32.819, |
|
"step": 910 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"step": 910, |
|
"total_flos": 1883034567828480.0, |
|
"train_loss": 0.09724931471295409, |
|
"train_runtime": 322.9196, |
|
"train_samples_per_second": 44.624, |
|
"train_steps_per_second": 2.818 |
|
} |
|
], |
|
"max_steps": 910, |
|
"num_train_epochs": 10, |
|
"total_flos": 1883034567828480.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|