File size: 1,695 Bytes
1da9e2f 35b1422 1da9e2f 35b1422 1da9e2f 35b1422 1da9e2f 35b1422 1da9e2f 35b1422 1da9e2f 35b1422 1da9e2f 35b1422 1da9e2f 35b1422 1da9e2f 35b1422 1da9e2f 35b1422 1da9e2f 35b1422 1da9e2f 35b1422 1da9e2f 35b1422 1da9e2f 35b1422 1da9e2f |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 |
{
"best_metric": 1.127414345741272,
"best_model_checkpoint": "/kaggle/output/checkpoint-3000",
"epoch": 0.12222946544980444,
"eval_steps": 1000,
"global_step": 3000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.0,
"learning_rate": 2.7777777777777777e-11,
"loss": 1.029,
"step": 1
},
{
"epoch": 0.04,
"learning_rate": 2.7638888888888893e-08,
"loss": 1.181,
"step": 1000
},
{
"epoch": 0.04,
"eval_accuracy": 0.3273453093812375,
"eval_loss": 1.1529844999313354,
"eval_runtime": 54.2837,
"eval_samples_per_second": 92.293,
"eval_steps_per_second": 11.55,
"step": 1000
},
{
"epoch": 0.08,
"learning_rate": 5.541666666666667e-08,
"loss": 1.1527,
"step": 2000
},
{
"epoch": 0.08,
"eval_accuracy": 0.33013972055888224,
"eval_loss": 1.1351025104522705,
"eval_runtime": 54.0518,
"eval_samples_per_second": 92.689,
"eval_steps_per_second": 11.6,
"step": 2000
},
{
"epoch": 0.12,
"learning_rate": 8.316666666666666e-08,
"loss": 1.142,
"step": 3000
},
{
"epoch": 0.12,
"eval_accuracy": 0.3317365269461078,
"eval_loss": 1.127414345741272,
"eval_runtime": 54.0871,
"eval_samples_per_second": 92.628,
"eval_steps_per_second": 11.592,
"step": 3000
}
],
"logging_steps": 1000,
"max_steps": 10000000,
"num_train_epochs": 408,
"save_steps": 1000,
"total_flos": 6271065391104000.0,
"trial_name": null,
"trial_params": null
}
|