{ "best_metric": 0.9064039408866996, "best_model_checkpoint": "AAmeni/LILT-checkpoints/checkpoint-1600", "epoch": 26.829268292682926, "eval_steps": 200, "global_step": 2200, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 2.4390243902439024, "eval_accuracy": 0.9208400646203554, "eval_f1": 0.8652657601977751, "eval_loss": 0.29326215386390686, "eval_precision": 0.875, "eval_recall": 0.8557457212713936, "eval_runtime": 10.0837, "eval_samples_per_second": 4.165, "eval_steps_per_second": 1.091, "step": 200 }, { "epoch": 4.878048780487805, "eval_accuracy": 0.925686591276252, "eval_f1": 0.8767123287671232, "eval_loss": 0.3650479018688202, "eval_precision": 0.8934010152284264, "eval_recall": 0.8606356968215159, "eval_runtime": 10.3053, "eval_samples_per_second": 4.076, "eval_steps_per_second": 1.067, "step": 400 }, { "epoch": 6.097560975609756, "grad_norm": 15.58462905883789, "learning_rate": 3.989837398373984e-05, "loss": 0.3014, "step": 500 }, { "epoch": 7.317073170731708, "eval_accuracy": 0.938610662358643, "eval_f1": 0.8976572133168927, "eval_loss": 0.382191926240921, "eval_precision": 0.9054726368159204, "eval_recall": 0.8899755501222494, "eval_runtime": 9.3762, "eval_samples_per_second": 4.479, "eval_steps_per_second": 1.173, "step": 600 }, { "epoch": 9.75609756097561, "eval_accuracy": 0.938610662358643, "eval_f1": 0.8902589395807645, "eval_loss": 0.4051755368709564, "eval_precision": 0.8980099502487562, "eval_recall": 0.882640586797066, "eval_runtime": 8.2706, "eval_samples_per_second": 5.078, "eval_steps_per_second": 1.33, "step": 800 }, { "epoch": 12.195121951219512, "grad_norm": 0.035131603479385376, "learning_rate": 2.973577235772358e-05, "loss": 0.0365, "step": 1000 }, { "epoch": 12.195121951219512, "eval_accuracy": 0.938610662358643, "eval_f1": 0.8932515337423313, "eval_loss": 0.4668120741844177, "eval_precision": 0.896551724137931, "eval_recall": 0.8899755501222494, "eval_runtime": 10.5119, "eval_samples_per_second": 3.995, "eval_steps_per_second": 1.046, "step": 1000 }, { "epoch": 14.634146341463415, "eval_accuracy": 0.9434571890145396, "eval_f1": 0.9009900990099009, "eval_loss": 0.46639078855514526, "eval_precision": 0.9122807017543859, "eval_recall": 0.8899755501222494, "eval_runtime": 9.1524, "eval_samples_per_second": 4.589, "eval_steps_per_second": 1.202, "step": 1200 }, { "epoch": 17.073170731707318, "eval_accuracy": 0.9369951534733441, "eval_f1": 0.8888888888888887, "eval_loss": 0.4993242025375366, "eval_precision": 0.8977556109725686, "eval_recall": 0.8801955990220048, "eval_runtime": 8.3567, "eval_samples_per_second": 5.026, "eval_steps_per_second": 1.316, "step": 1400 }, { "epoch": 18.29268292682927, "grad_norm": 0.003389735473319888, "learning_rate": 1.957317073170732e-05, "loss": 0.0091, "step": 1500 }, { "epoch": 19.51219512195122, "eval_accuracy": 0.9466882067851373, "eval_f1": 0.9064039408866996, "eval_loss": 0.47225338220596313, "eval_precision": 0.913151364764268, "eval_recall": 0.8997555012224939, "eval_runtime": 9.4714, "eval_samples_per_second": 4.434, "eval_steps_per_second": 1.161, "step": 1600 }, { "epoch": 21.951219512195124, "eval_accuracy": 0.9466882067851373, "eval_f1": 0.905521472392638, "eval_loss": 0.4826250672340393, "eval_precision": 0.9088669950738916, "eval_recall": 0.902200488997555, "eval_runtime": 9.1048, "eval_samples_per_second": 4.613, "eval_steps_per_second": 1.208, "step": 1800 }, { "epoch": 24.390243902439025, "grad_norm": 0.0026210923679172993, "learning_rate": 9.410569105691056e-06, "loss": 0.0004, "step": 2000 }, { "epoch": 24.390243902439025, "eval_accuracy": 0.9466882067851373, "eval_f1": 0.9041769041769042, "eval_loss": 0.4790293276309967, "eval_precision": 0.908641975308642, "eval_recall": 0.8997555012224939, "eval_runtime": 8.7609, "eval_samples_per_second": 4.794, "eval_steps_per_second": 1.256, "step": 2000 }, { "epoch": 26.829268292682926, "eval_accuracy": 0.9466882067851373, "eval_f1": 0.9041769041769042, "eval_loss": 0.48069363832473755, "eval_precision": 0.908641975308642, "eval_recall": 0.8997555012224939, "eval_runtime": 8.8195, "eval_samples_per_second": 4.762, "eval_steps_per_second": 1.247, "step": 2200 } ], "logging_steps": 500, "max_steps": 2460, "num_input_tokens_seen": 0, "num_train_epochs": 30, "save_steps": 200, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false }, "attributes": {} } }, "total_flos": 1223905878835200.0, "train_batch_size": 2, "trial_name": null, "trial_params": null }