{ "best_metric": 12.457650398315174, "best_model_checkpoint": "./checkpoint-300", "epoch": 1.1027522935779817, "global_step": 300, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.09, "learning_rate": 2.3000000000000004e-06, "loss": 0.5068, "step": 25 }, { "epoch": 0.18, "learning_rate": 4.800000000000001e-06, "loss": 0.2745, "step": 50 }, { "epoch": 0.28, "learning_rate": 7.3e-06, "loss": 0.2341, "step": 75 }, { "epoch": 0.37, "learning_rate": 9.800000000000001e-06, "loss": 0.2097, "step": 100 }, { "epoch": 0.37, "eval_loss": 0.26155176758766174, "eval_runtime": 6495.4175, "eval_samples_per_second": 0.446, "eval_steps_per_second": 0.056, "eval_wer": 17.6700851570369, "step": 100 }, { "epoch": 0.46, "learning_rate": 8.85e-06, "loss": 0.2161, "step": 125 }, { "epoch": 0.55, "learning_rate": 7.600000000000001e-06, "loss": 0.2043, "step": 150 }, { "epoch": 0.64, "learning_rate": 6.35e-06, "loss": 0.1803, "step": 175 }, { "epoch": 0.73, "learning_rate": 5.150000000000001e-06, "loss": 0.1578, "step": 200 }, { "epoch": 0.73, "eval_loss": 0.21081551909446716, "eval_runtime": 6471.6616, "eval_samples_per_second": 0.447, "eval_steps_per_second": 0.056, "eval_wer": 14.098983609559564, "step": 200 }, { "epoch": 0.83, "learning_rate": 3.900000000000001e-06, "loss": 0.1696, "step": 225 }, { "epoch": 0.92, "learning_rate": 2.6500000000000005e-06, "loss": 0.144, "step": 250 }, { "epoch": 1.01, "learning_rate": 1.4000000000000001e-06, "loss": 0.1274, "step": 275 }, { "epoch": 1.1, "learning_rate": 1.5000000000000002e-07, "loss": 0.0806, "step": 300 }, { "epoch": 1.1, "eval_loss": 0.18695282936096191, "eval_runtime": 6462.2032, "eval_samples_per_second": 0.448, "eval_steps_per_second": 0.056, "eval_wer": 12.457650398315174, "step": 300 }, { "epoch": 1.1, "step": 300, "total_flos": 1.02039599259648e+19, "train_loss": 0.20877531051635742, "train_runtime": 20970.8306, "train_samples_per_second": 0.229, "train_steps_per_second": 0.014 } ], "max_steps": 300, "num_train_epochs": 2, "total_flos": 1.02039599259648e+19, "trial_name": null, "trial_params": null }