tectonatech's picture
End of training
90aa7db verified
{
"best_metric": 0.8781512605042017,
"best_model_checkpoint": "swin-tiny-patch4-window7-224-fine_tune/checkpoint-167",
"epoch": 19.104477611940297,
"eval_steps": 500,
"global_step": 320,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.6,
"learning_rate": 1.5625e-05,
"loss": 5.175,
"step": 10
},
{
"epoch": 0.96,
"eval_accuracy": 0.13445378151260504,
"eval_loss": 4.7966742515563965,
"eval_runtime": 1.6208,
"eval_samples_per_second": 146.838,
"eval_steps_per_second": 4.936,
"step": 16
},
{
"epoch": 1.19,
"learning_rate": 3.125e-05,
"loss": 4.8832,
"step": 20
},
{
"epoch": 1.79,
"learning_rate": 4.6875e-05,
"loss": 4.1158,
"step": 30
},
{
"epoch": 1.97,
"eval_accuracy": 0.38235294117647056,
"eval_loss": 2.997732400894165,
"eval_runtime": 1.6523,
"eval_samples_per_second": 144.038,
"eval_steps_per_second": 4.842,
"step": 33
},
{
"epoch": 2.39,
"learning_rate": 4.8611111111111115e-05,
"loss": 2.8326,
"step": 40
},
{
"epoch": 2.99,
"learning_rate": 4.6875e-05,
"loss": 2.0676,
"step": 50
},
{
"epoch": 2.99,
"eval_accuracy": 0.680672268907563,
"eval_loss": 1.5415246486663818,
"eval_runtime": 1.6113,
"eval_samples_per_second": 147.705,
"eval_steps_per_second": 4.965,
"step": 50
},
{
"epoch": 3.58,
"learning_rate": 4.5138888888888894e-05,
"loss": 1.4395,
"step": 60
},
{
"epoch": 4.0,
"eval_accuracy": 0.8151260504201681,
"eval_loss": 0.9951003193855286,
"eval_runtime": 1.6214,
"eval_samples_per_second": 146.787,
"eval_steps_per_second": 4.934,
"step": 67
},
{
"epoch": 4.18,
"learning_rate": 4.340277777777778e-05,
"loss": 1.2087,
"step": 70
},
{
"epoch": 4.78,
"learning_rate": 4.166666666666667e-05,
"loss": 0.9396,
"step": 80
},
{
"epoch": 4.96,
"eval_accuracy": 0.8277310924369747,
"eval_loss": 0.8235336542129517,
"eval_runtime": 1.616,
"eval_samples_per_second": 147.279,
"eval_steps_per_second": 4.951,
"step": 83
},
{
"epoch": 5.37,
"learning_rate": 3.993055555555556e-05,
"loss": 0.8842,
"step": 90
},
{
"epoch": 5.97,
"learning_rate": 3.8194444444444444e-05,
"loss": 0.7456,
"step": 100
},
{
"epoch": 5.97,
"eval_accuracy": 0.8361344537815126,
"eval_loss": 0.7195001244544983,
"eval_runtime": 1.7613,
"eval_samples_per_second": 135.126,
"eval_steps_per_second": 4.542,
"step": 100
},
{
"epoch": 6.57,
"learning_rate": 3.6458333333333336e-05,
"loss": 0.666,
"step": 110
},
{
"epoch": 6.99,
"eval_accuracy": 0.8613445378151261,
"eval_loss": 0.6406444907188416,
"eval_runtime": 1.8597,
"eval_samples_per_second": 127.977,
"eval_steps_per_second": 4.302,
"step": 117
},
{
"epoch": 7.16,
"learning_rate": 3.472222222222222e-05,
"loss": 0.5804,
"step": 120
},
{
"epoch": 7.76,
"learning_rate": 3.2986111111111115e-05,
"loss": 0.5893,
"step": 130
},
{
"epoch": 8.0,
"eval_accuracy": 0.8739495798319328,
"eval_loss": 0.6045222282409668,
"eval_runtime": 1.892,
"eval_samples_per_second": 125.796,
"eval_steps_per_second": 4.228,
"step": 134
},
{
"epoch": 8.36,
"learning_rate": 3.125e-05,
"loss": 0.4919,
"step": 140
},
{
"epoch": 8.96,
"learning_rate": 2.951388888888889e-05,
"loss": 0.4704,
"step": 150
},
{
"epoch": 8.96,
"eval_accuracy": 0.865546218487395,
"eval_loss": 0.6015978455543518,
"eval_runtime": 1.9839,
"eval_samples_per_second": 119.967,
"eval_steps_per_second": 4.033,
"step": 150
},
{
"epoch": 9.55,
"learning_rate": 2.777777777777778e-05,
"loss": 0.4475,
"step": 160
},
{
"epoch": 9.97,
"eval_accuracy": 0.8781512605042017,
"eval_loss": 0.5957779884338379,
"eval_runtime": 2.0047,
"eval_samples_per_second": 118.723,
"eval_steps_per_second": 3.991,
"step": 167
},
{
"epoch": 10.15,
"learning_rate": 2.604166666666667e-05,
"loss": 0.3907,
"step": 170
},
{
"epoch": 10.75,
"learning_rate": 2.4305555555555558e-05,
"loss": 0.3937,
"step": 180
},
{
"epoch": 10.99,
"eval_accuracy": 0.8781512605042017,
"eval_loss": 0.5855588316917419,
"eval_runtime": 1.9315,
"eval_samples_per_second": 123.218,
"eval_steps_per_second": 4.142,
"step": 184
},
{
"epoch": 11.34,
"learning_rate": 2.2569444444444447e-05,
"loss": 0.3648,
"step": 190
},
{
"epoch": 11.94,
"learning_rate": 2.0833333333333336e-05,
"loss": 0.3327,
"step": 200
},
{
"epoch": 12.0,
"eval_accuracy": 0.8781512605042017,
"eval_loss": 0.576105535030365,
"eval_runtime": 1.9179,
"eval_samples_per_second": 124.091,
"eval_steps_per_second": 4.171,
"step": 201
},
{
"epoch": 12.54,
"learning_rate": 1.9097222222222222e-05,
"loss": 0.3277,
"step": 210
},
{
"epoch": 12.96,
"eval_accuracy": 0.8781512605042017,
"eval_loss": 0.5758181214332581,
"eval_runtime": 1.7928,
"eval_samples_per_second": 132.756,
"eval_steps_per_second": 4.462,
"step": 217
},
{
"epoch": 13.13,
"learning_rate": 1.736111111111111e-05,
"loss": 0.3015,
"step": 220
},
{
"epoch": 13.73,
"learning_rate": 1.5625e-05,
"loss": 0.2928,
"step": 230
},
{
"epoch": 13.97,
"eval_accuracy": 0.8739495798319328,
"eval_loss": 0.5753782391548157,
"eval_runtime": 1.6937,
"eval_samples_per_second": 140.52,
"eval_steps_per_second": 4.723,
"step": 234
},
{
"epoch": 14.33,
"learning_rate": 1.388888888888889e-05,
"loss": 0.3066,
"step": 240
},
{
"epoch": 14.93,
"learning_rate": 1.2152777777777779e-05,
"loss": 0.2545,
"step": 250
},
{
"epoch": 14.99,
"eval_accuracy": 0.8739495798319328,
"eval_loss": 0.5710859298706055,
"eval_runtime": 1.6244,
"eval_samples_per_second": 146.515,
"eval_steps_per_second": 4.925,
"step": 251
},
{
"epoch": 15.52,
"learning_rate": 1.0416666666666668e-05,
"loss": 0.2657,
"step": 260
},
{
"epoch": 16.0,
"eval_accuracy": 0.8739495798319328,
"eval_loss": 0.5850977301597595,
"eval_runtime": 1.6309,
"eval_samples_per_second": 145.929,
"eval_steps_per_second": 4.905,
"step": 268
},
{
"epoch": 16.12,
"learning_rate": 8.680555555555556e-06,
"loss": 0.2504,
"step": 270
},
{
"epoch": 16.72,
"learning_rate": 6.944444444444445e-06,
"loss": 0.2457,
"step": 280
},
{
"epoch": 16.96,
"eval_accuracy": 0.865546218487395,
"eval_loss": 0.5805228352546692,
"eval_runtime": 1.8182,
"eval_samples_per_second": 130.897,
"eval_steps_per_second": 4.4,
"step": 284
},
{
"epoch": 17.31,
"learning_rate": 5.208333333333334e-06,
"loss": 0.2431,
"step": 290
},
{
"epoch": 17.91,
"learning_rate": 3.4722222222222224e-06,
"loss": 0.2359,
"step": 300
},
{
"epoch": 17.97,
"eval_accuracy": 0.8697478991596639,
"eval_loss": 0.576209545135498,
"eval_runtime": 1.6467,
"eval_samples_per_second": 144.532,
"eval_steps_per_second": 4.858,
"step": 301
},
{
"epoch": 18.51,
"learning_rate": 1.7361111111111112e-06,
"loss": 0.2849,
"step": 310
},
{
"epoch": 18.99,
"eval_accuracy": 0.8739495798319328,
"eval_loss": 0.57916259765625,
"eval_runtime": 1.7294,
"eval_samples_per_second": 137.622,
"eval_steps_per_second": 4.626,
"step": 318
},
{
"epoch": 19.1,
"learning_rate": 0.0,
"loss": 0.223,
"step": 320
},
{
"epoch": 19.1,
"eval_accuracy": 0.8739495798319328,
"eval_loss": 0.5791583061218262,
"eval_runtime": 1.6568,
"eval_samples_per_second": 143.653,
"eval_steps_per_second": 4.829,
"step": 320
},
{
"epoch": 19.1,
"step": 320,
"total_flos": 1.0205933497811251e+18,
"train_loss": 1.0078448697924614,
"train_runtime": 686.2446,
"train_samples_per_second": 62.339,
"train_steps_per_second": 0.466
}
],
"logging_steps": 10,
"max_steps": 320,
"num_input_tokens_seen": 0,
"num_train_epochs": 20,
"save_steps": 500,
"total_flos": 1.0205933497811251e+18,
"train_batch_size": 32,
"trial_name": null,
"trial_params": null
}