|
{ |
|
"best_metric": 0.8785714285714286, |
|
"best_model_checkpoint": "Human-Action-Recognition-VIT-Base-patch16-224/checkpoint-316", |
|
"epoch": 19.746835443037973, |
|
"eval_steps": 500, |
|
"global_step": 780, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.99, |
|
"learning_rate": 2.5e-05, |
|
"loss": 2.6396, |
|
"step": 39 |
|
}, |
|
{ |
|
"epoch": 0.99, |
|
"eval_accuracy": 0.44246031746031744, |
|
"eval_loss": 2.04364275932312, |
|
"eval_runtime": 33.6234, |
|
"eval_samples_per_second": 74.948, |
|
"eval_steps_per_second": 1.19, |
|
"step": 39 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 4.992877492877493e-05, |
|
"loss": 1.4579, |
|
"step": 79 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.7916666666666666, |
|
"eval_loss": 0.7552899122238159, |
|
"eval_runtime": 33.9732, |
|
"eval_samples_per_second": 74.176, |
|
"eval_steps_per_second": 1.177, |
|
"step": 79 |
|
}, |
|
{ |
|
"epoch": 2.99, |
|
"learning_rate": 4.7150997150997157e-05, |
|
"loss": 0.8342, |
|
"step": 118 |
|
}, |
|
{ |
|
"epoch": 2.99, |
|
"eval_accuracy": 0.8416666666666667, |
|
"eval_loss": 0.5296158194541931, |
|
"eval_runtime": 33.8808, |
|
"eval_samples_per_second": 74.378, |
|
"eval_steps_per_second": 1.181, |
|
"step": 118 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"learning_rate": 4.4301994301994304e-05, |
|
"loss": 0.6649, |
|
"step": 158 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.8496031746031746, |
|
"eval_loss": 0.4977969229221344, |
|
"eval_runtime": 33.6309, |
|
"eval_samples_per_second": 74.931, |
|
"eval_steps_per_second": 1.189, |
|
"step": 158 |
|
}, |
|
{ |
|
"epoch": 4.99, |
|
"learning_rate": 4.152421652421652e-05, |
|
"loss": 0.6137, |
|
"step": 197 |
|
}, |
|
{ |
|
"epoch": 4.99, |
|
"eval_accuracy": 0.8595238095238096, |
|
"eval_loss": 0.44600579142570496, |
|
"eval_runtime": 33.559, |
|
"eval_samples_per_second": 75.092, |
|
"eval_steps_per_second": 1.192, |
|
"step": 197 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"learning_rate": 3.867521367521368e-05, |
|
"loss": 0.5374, |
|
"step": 237 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.8626984126984127, |
|
"eval_loss": 0.43557941913604736, |
|
"eval_runtime": 33.4656, |
|
"eval_samples_per_second": 75.301, |
|
"eval_steps_per_second": 1.195, |
|
"step": 237 |
|
}, |
|
{ |
|
"epoch": 6.99, |
|
"learning_rate": 3.58974358974359e-05, |
|
"loss": 0.514, |
|
"step": 276 |
|
}, |
|
{ |
|
"epoch": 6.99, |
|
"eval_accuracy": 0.8615079365079366, |
|
"eval_loss": 0.4348864257335663, |
|
"eval_runtime": 33.7031, |
|
"eval_samples_per_second": 74.771, |
|
"eval_steps_per_second": 1.187, |
|
"step": 276 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"learning_rate": 3.304843304843305e-05, |
|
"loss": 0.475, |
|
"step": 316 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.8785714285714286, |
|
"eval_loss": 0.4005189836025238, |
|
"eval_runtime": 33.4656, |
|
"eval_samples_per_second": 75.301, |
|
"eval_steps_per_second": 1.195, |
|
"step": 316 |
|
}, |
|
{ |
|
"epoch": 8.99, |
|
"learning_rate": 3.0270655270655275e-05, |
|
"loss": 0.4663, |
|
"step": 355 |
|
}, |
|
{ |
|
"epoch": 8.99, |
|
"eval_accuracy": 0.8658730158730159, |
|
"eval_loss": 0.4163670241832733, |
|
"eval_runtime": 33.7779, |
|
"eval_samples_per_second": 74.605, |
|
"eval_steps_per_second": 1.184, |
|
"step": 355 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"learning_rate": 2.7421652421652423e-05, |
|
"loss": 0.4178, |
|
"step": 395 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.8738095238095238, |
|
"eval_loss": 0.4127999544143677, |
|
"eval_runtime": 33.3961, |
|
"eval_samples_per_second": 75.458, |
|
"eval_steps_per_second": 1.198, |
|
"step": 395 |
|
}, |
|
{ |
|
"epoch": 10.99, |
|
"learning_rate": 2.4643874643874645e-05, |
|
"loss": 0.4226, |
|
"step": 434 |
|
}, |
|
{ |
|
"epoch": 10.99, |
|
"eval_accuracy": 0.8690476190476191, |
|
"eval_loss": 0.4115118980407715, |
|
"eval_runtime": 33.5412, |
|
"eval_samples_per_second": 75.131, |
|
"eval_steps_per_second": 1.193, |
|
"step": 434 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"learning_rate": 2.1794871794871795e-05, |
|
"loss": 0.3896, |
|
"step": 474 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_accuracy": 0.875, |
|
"eval_loss": 0.4112005829811096, |
|
"eval_runtime": 33.6831, |
|
"eval_samples_per_second": 74.815, |
|
"eval_steps_per_second": 1.188, |
|
"step": 474 |
|
}, |
|
{ |
|
"epoch": 12.99, |
|
"learning_rate": 1.9017094017094017e-05, |
|
"loss": 0.3866, |
|
"step": 513 |
|
}, |
|
{ |
|
"epoch": 12.99, |
|
"eval_accuracy": 0.8714285714285714, |
|
"eval_loss": 0.4072014093399048, |
|
"eval_runtime": 33.7064, |
|
"eval_samples_per_second": 74.763, |
|
"eval_steps_per_second": 1.187, |
|
"step": 513 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"learning_rate": 1.6168091168091168e-05, |
|
"loss": 0.3632, |
|
"step": 553 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_accuracy": 0.8718253968253968, |
|
"eval_loss": 0.41061681509017944, |
|
"eval_runtime": 33.9136, |
|
"eval_samples_per_second": 74.306, |
|
"eval_steps_per_second": 1.179, |
|
"step": 553 |
|
}, |
|
{ |
|
"epoch": 14.99, |
|
"learning_rate": 1.3390313390313392e-05, |
|
"loss": 0.3596, |
|
"step": 592 |
|
}, |
|
{ |
|
"epoch": 14.99, |
|
"eval_accuracy": 0.8714285714285714, |
|
"eval_loss": 0.4042780101299286, |
|
"eval_runtime": 33.971, |
|
"eval_samples_per_second": 74.181, |
|
"eval_steps_per_second": 1.177, |
|
"step": 592 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"learning_rate": 1.0541310541310543e-05, |
|
"loss": 0.3421, |
|
"step": 632 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_accuracy": 0.8674603174603175, |
|
"eval_loss": 0.4128040075302124, |
|
"eval_runtime": 33.5678, |
|
"eval_samples_per_second": 75.072, |
|
"eval_steps_per_second": 1.192, |
|
"step": 632 |
|
}, |
|
{ |
|
"epoch": 16.99, |
|
"learning_rate": 7.763532763532765e-06, |
|
"loss": 0.344, |
|
"step": 671 |
|
}, |
|
{ |
|
"epoch": 16.99, |
|
"eval_accuracy": 0.8642857142857143, |
|
"eval_loss": 0.41805535554885864, |
|
"eval_runtime": 33.6623, |
|
"eval_samples_per_second": 74.861, |
|
"eval_steps_per_second": 1.188, |
|
"step": 671 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"learning_rate": 4.914529914529915e-06, |
|
"loss": 0.3447, |
|
"step": 711 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_accuracy": 0.8686507936507937, |
|
"eval_loss": 0.41281768679618835, |
|
"eval_runtime": 33.9679, |
|
"eval_samples_per_second": 74.188, |
|
"eval_steps_per_second": 1.178, |
|
"step": 711 |
|
}, |
|
{ |
|
"epoch": 18.99, |
|
"learning_rate": 2.136752136752137e-06, |
|
"loss": 0.3407, |
|
"step": 750 |
|
}, |
|
{ |
|
"epoch": 18.99, |
|
"eval_accuracy": 0.8714285714285714, |
|
"eval_loss": 0.40965768694877625, |
|
"eval_runtime": 33.6119, |
|
"eval_samples_per_second": 74.973, |
|
"eval_steps_per_second": 1.19, |
|
"step": 750 |
|
}, |
|
{ |
|
"epoch": 19.75, |
|
"learning_rate": 0.0, |
|
"loss": 0.3267, |
|
"step": 780 |
|
}, |
|
{ |
|
"epoch": 19.75, |
|
"eval_accuracy": 0.8682539682539683, |
|
"eval_loss": 0.40967872738838196, |
|
"eval_runtime": 34.1352, |
|
"eval_samples_per_second": 73.824, |
|
"eval_steps_per_second": 1.172, |
|
"step": 780 |
|
}, |
|
{ |
|
"epoch": 19.75, |
|
"step": 780, |
|
"total_flos": 1.5428282771770638e+19, |
|
"train_loss": 0.6146706715608254, |
|
"train_runtime": 7303.7952, |
|
"train_samples_per_second": 27.602, |
|
"train_steps_per_second": 0.107 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 780, |
|
"num_train_epochs": 20, |
|
"save_steps": 500, |
|
"total_flos": 1.5428282771770638e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|