{ "best_metric": 0.9135991932046025, "best_model_checkpoint": "../models/eusts/checkpoint-2180", "epoch": 10.0, "global_step": 2180, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "learning_rate": 2.8726207906295755e-05, "loss": 1.4053, "step": 218 }, { "epoch": 1.0, "eval_combined_score": 0.8498445305588846, "eval_loss": 0.5913795232772827, "eval_pearson": 0.8576485507627736, "eval_runtime": 10.4654, "eval_samples_per_second": 83.227, "eval_spearmanr": 0.8420405103549957, "eval_steps_per_second": 10.415, "step": 218 }, { "epoch": 2.0, "learning_rate": 2.553440702781845e-05, "loss": 0.3881, "step": 436 }, { "epoch": 2.0, "eval_combined_score": 0.887035736675172, "eval_loss": 0.447421669960022, "eval_pearson": 0.8917341241804541, "eval_runtime": 10.5067, "eval_samples_per_second": 82.899, "eval_spearmanr": 0.8823373491698899, "eval_steps_per_second": 10.374, "step": 436 }, { "epoch": 3.0, "learning_rate": 2.2342606149341143e-05, "loss": 0.2083, "step": 654 }, { "epoch": 3.0, "eval_combined_score": 0.8970108216951012, "eval_loss": 0.4096603989601135, "eval_pearson": 0.9016467997316473, "eval_runtime": 10.4817, "eval_samples_per_second": 83.097, "eval_spearmanr": 0.8923748436585551, "eval_steps_per_second": 10.399, "step": 654 }, { "epoch": 4.0, "learning_rate": 1.9150805270863837e-05, "loss": 0.1393, "step": 872 }, { "epoch": 4.0, "eval_combined_score": 0.9009673665742599, "eval_loss": 0.3968064486980438, "eval_pearson": 0.9046095606853766, "eval_runtime": 10.448, "eval_samples_per_second": 83.366, "eval_spearmanr": 0.8973251724631434, "eval_steps_per_second": 10.433, "step": 872 }, { "epoch": 5.0, "learning_rate": 1.595900439238653e-05, "loss": 0.1023, "step": 1090 }, { "epoch": 5.0, "eval_combined_score": 0.906389648678596, "eval_loss": 0.38093939423561096, "eval_pearson": 0.9095917410726173, "eval_runtime": 10.7338, "eval_samples_per_second": 81.146, "eval_spearmanr": 0.9031875562845746, "eval_steps_per_second": 10.155, "step": 1090 }, { "epoch": 6.0, "learning_rate": 1.2767203513909225e-05, "loss": 0.0841, "step": 1308 }, { "epoch": 6.0, "eval_combined_score": 0.9098955778506463, "eval_loss": 0.37849491834640503, "eval_pearson": 0.9139073667065271, "eval_runtime": 10.6077, "eval_samples_per_second": 82.11, "eval_spearmanr": 0.9058837889947655, "eval_steps_per_second": 10.276, "step": 1308 }, { "epoch": 7.0, "learning_rate": 9.575402635431918e-06, "loss": 0.0664, "step": 1526 }, { "epoch": 7.0, "eval_combined_score": 0.9111955743924036, "eval_loss": 0.35929641127586365, "eval_pearson": 0.9148956072886006, "eval_runtime": 10.7134, "eval_samples_per_second": 81.3, "eval_spearmanr": 0.9074955414962067, "eval_steps_per_second": 10.174, "step": 1526 }, { "epoch": 8.0, "learning_rate": 6.383601756954612e-06, "loss": 0.057, "step": 1744 }, { "epoch": 8.0, "eval_combined_score": 0.9122781067251765, "eval_loss": 0.3573194146156311, "eval_pearson": 0.9160432969800479, "eval_runtime": 10.694, "eval_samples_per_second": 81.448, "eval_spearmanr": 0.9085129164703051, "eval_steps_per_second": 10.193, "step": 1744 }, { "epoch": 9.0, "learning_rate": 3.191800878477306e-06, "loss": 0.0485, "step": 1962 }, { "epoch": 9.0, "eval_combined_score": 0.9128873266818468, "eval_loss": 0.3531445860862732, "eval_pearson": 0.9165594039106797, "eval_runtime": 10.7576, "eval_samples_per_second": 80.966, "eval_spearmanr": 0.9092152494530139, "eval_steps_per_second": 10.132, "step": 1962 }, { "epoch": 10.0, "learning_rate": 0.0, "loss": 0.0449, "step": 2180 }, { "epoch": 10.0, "eval_combined_score": 0.9135991932046025, "eval_loss": 0.3487534821033478, "eval_pearson": 0.917271052630473, "eval_runtime": 10.8295, "eval_samples_per_second": 80.428, "eval_spearmanr": 0.9099273337787319, "eval_steps_per_second": 10.065, "step": 2180 }, { "epoch": 10.0, "step": 2180, "total_flos": 1.834393807540224e+16, "train_loss": 0.2544048738042149, "train_runtime": 2592.0512, "train_samples_per_second": 26.898, "train_steps_per_second": 0.841 } ], "max_steps": 2180, "num_train_epochs": 10, "total_flos": 1.834393807540224e+16, "trial_name": null, "trial_params": null }