{ "best_metric": 0.8100333518621456, "best_model_checkpoint": "tinybert-TG-HS-HX-parentpretrained\\run-9\\checkpoint-1182", "epoch": 7.0, "eval_steps": 500, "global_step": 1379, "is_hyper_param_search": true, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "learning_rate": 1.1884492449582221e-05, "loss": 0.3771, "step": 197 }, { "epoch": 1.0, "eval_accuracy": 0.7761256253474152, "eval_loss": 0.35103824734687805, "eval_runtime": 125.0972, "eval_samples_per_second": 57.523, "eval_steps_per_second": 0.456, "step": 197 }, { "epoch": 2.0, "learning_rate": 1.0186707813927618e-05, "loss": 0.356, "step": 394 }, { "epoch": 2.0, "eval_accuracy": 0.7898832684824902, "eval_loss": 0.3439778685569763, "eval_runtime": 125.0439, "eval_samples_per_second": 57.548, "eval_steps_per_second": 0.456, "step": 394 }, { "epoch": 3.0, "learning_rate": 8.488923178273016e-06, "loss": 0.3473, "step": 591 }, { "epoch": 3.0, "eval_accuracy": 0.797526403557532, "eval_loss": 0.34075456857681274, "eval_runtime": 125.2215, "eval_samples_per_second": 57.466, "eval_steps_per_second": 0.455, "step": 591 }, { "epoch": 4.0, "learning_rate": 6.791138542618412e-06, "loss": 0.3428, "step": 788 }, { "epoch": 4.0, "eval_accuracy": 0.8030850472484714, "eval_loss": 0.33721399307250977, "eval_runtime": 124.8586, "eval_samples_per_second": 57.633, "eval_steps_per_second": 0.457, "step": 788 }, { "epoch": 5.0, "learning_rate": 5.093353906963809e-06, "loss": 0.3391, "step": 985 }, { "epoch": 5.0, "eval_accuracy": 0.8060033351862146, "eval_loss": 0.33657532930374146, "eval_runtime": 125.0566, "eval_samples_per_second": 57.542, "eval_steps_per_second": 0.456, "step": 985 }, { "epoch": 6.0, "learning_rate": 3.395569271309206e-06, "loss": 0.3354, "step": 1182 }, { "epoch": 6.0, "eval_accuracy": 0.8100333518621456, "eval_loss": 0.33524009585380554, "eval_runtime": 124.7339, "eval_samples_per_second": 57.691, "eval_steps_per_second": 0.457, "step": 1182 }, { "epoch": 7.0, "learning_rate": 1.697784635654603e-06, "loss": 0.3337, "step": 1379 }, { "epoch": 7.0, "eval_accuracy": 0.8090605892162313, "eval_loss": 0.33525848388671875, "eval_runtime": 125.0522, "eval_samples_per_second": 57.544, "eval_steps_per_second": 0.456, "step": 1379 } ], "logging_steps": 500, "max_steps": 1576, "num_input_tokens_seen": 0, "num_train_epochs": 8, "save_steps": 500, "total_flos": 309665393535204.0, "trial_name": null, "trial_params": { "alpha": 0.625656755680376, "learning_rate": 1.3582277085236825e-05, "num_train_epochs": 8, "temperature": 10 } }