{ "best_metric": 0.7445255474452556, "best_model_checkpoint": "outputs/indobert-base-p1-twitter-indonesia-sarcastic/checkpoint-472", "epoch": 11.0, "eval_steps": 500, "global_step": 649, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "learning_rate": 9.997532801828659e-06, "loss": 0.5101, "step": 59 }, { "epoch": 1.0, "eval_accuracy": 0.7835820895522388, "eval_f1": 0.608108108108108, "eval_loss": 0.4220750629901886, "eval_precision": 0.5555555555555556, "eval_recall": 0.6716417910447762, "eval_runtime": 1.0673, "eval_samples_per_second": 251.108, "eval_steps_per_second": 4.685, "step": 59 }, { "epoch": 2.0, "learning_rate": 9.990133642141359e-06, "loss": 0.3508, "step": 118 }, { "epoch": 2.0, "eval_accuracy": 0.8246268656716418, "eval_f1": 0.6713286713286712, "eval_loss": 0.34792423248291016, "eval_precision": 0.631578947368421, "eval_recall": 0.7164179104477612, "eval_runtime": 1.0685, "eval_samples_per_second": 250.816, "eval_steps_per_second": 4.679, "step": 118 }, { "epoch": 3.0, "learning_rate": 9.9778098230154e-06, "loss": 0.221, "step": 177 }, { "epoch": 3.0, "eval_accuracy": 0.8582089552238806, "eval_f1": 0.6935483870967741, "eval_loss": 0.3511403799057007, "eval_precision": 0.7543859649122807, "eval_recall": 0.6417910447761194, "eval_runtime": 1.0653, "eval_samples_per_second": 251.58, "eval_steps_per_second": 4.694, "step": 177 }, { "epoch": 4.0, "learning_rate": 9.960573506572391e-06, "loss": 0.1157, "step": 236 }, { "epoch": 4.0, "eval_accuracy": 0.8395522388059702, "eval_f1": 0.6861313868613139, "eval_loss": 0.4352029263973236, "eval_precision": 0.6714285714285714, "eval_recall": 0.7014925373134329, "eval_runtime": 1.0649, "eval_samples_per_second": 251.673, "eval_steps_per_second": 4.695, "step": 236 }, { "epoch": 5.0, "learning_rate": 9.938441702975689e-06, "loss": 0.0453, "step": 295 }, { "epoch": 5.0, "eval_accuracy": 0.8582089552238806, "eval_f1": 0.7076923076923077, "eval_loss": 0.6923192739486694, "eval_precision": 0.7301587301587301, "eval_recall": 0.6865671641791045, "eval_runtime": 1.064, "eval_samples_per_second": 251.881, "eval_steps_per_second": 4.699, "step": 295 }, { "epoch": 6.0, "learning_rate": 9.911436253643445e-06, "loss": 0.0192, "step": 354 }, { "epoch": 6.0, "eval_accuracy": 0.8694029850746269, "eval_f1": 0.7286821705426356, "eval_loss": 0.7378106117248535, "eval_precision": 0.7580645161290323, "eval_recall": 0.7014925373134329, "eval_runtime": 1.0705, "eval_samples_per_second": 250.361, "eval_steps_per_second": 4.671, "step": 354 }, { "epoch": 7.0, "learning_rate": 9.880163895209396e-06, "loss": 0.0159, "step": 413 }, { "epoch": 7.0, "eval_accuracy": 0.8544776119402985, "eval_f1": 0.6722689075630253, "eval_loss": 0.8860062956809998, "eval_precision": 0.7692307692307693, "eval_recall": 0.5970149253731343, "eval_runtime": 1.0639, "eval_samples_per_second": 251.895, "eval_steps_per_second": 4.7, "step": 413 }, { "epoch": 8.0, "learning_rate": 9.843577222724305e-06, "loss": 0.0165, "step": 472 }, { "epoch": 8.0, "eval_accuracy": 0.8694029850746269, "eval_f1": 0.7445255474452556, "eval_loss": 0.8260650634765625, "eval_precision": 0.7285714285714285, "eval_recall": 0.7611940298507462, "eval_runtime": 1.0763, "eval_samples_per_second": 249.008, "eval_steps_per_second": 4.646, "step": 472 }, { "epoch": 9.0, "learning_rate": 9.80221052429255e-06, "loss": 0.0175, "step": 531 }, { "epoch": 9.0, "eval_accuracy": 0.8731343283582089, "eval_f1": 0.7424242424242424, "eval_loss": 0.8732029795646667, "eval_precision": 0.7538461538461538, "eval_recall": 0.7313432835820896, "eval_runtime": 1.0644, "eval_samples_per_second": 251.793, "eval_steps_per_second": 4.698, "step": 531 }, { "epoch": 10.0, "learning_rate": 9.756104623851222e-06, "loss": 0.0062, "step": 590 }, { "epoch": 10.0, "eval_accuracy": 0.8656716417910447, "eval_f1": 0.7272727272727273, "eval_loss": 0.9647775888442993, "eval_precision": 0.7384615384615385, "eval_recall": 0.7164179104477612, "eval_runtime": 1.0637, "eval_samples_per_second": 251.945, "eval_steps_per_second": 4.7, "step": 590 }, { "epoch": 11.0, "learning_rate": 9.705305022357621e-06, "loss": 0.0003, "step": 649 }, { "epoch": 11.0, "eval_accuracy": 0.8619402985074627, "eval_f1": 0.7175572519083969, "eval_loss": 1.0107759237289429, "eval_precision": 0.734375, "eval_recall": 0.7014925373134329, "eval_runtime": 1.0637, "eval_samples_per_second": 251.951, "eval_steps_per_second": 4.701, "step": 649 }, { "epoch": 11.0, "step": 649, "total_flos": 1358837045406720.0, "train_loss": 0.11986877576079226, "train_runtime": 294.5192, "train_samples_per_second": 637.649, "train_steps_per_second": 20.033 } ], "logging_steps": 500, "max_steps": 5900, "num_input_tokens_seen": 0, "num_train_epochs": 100, "save_steps": 500, "total_flos": 1358837045406720.0, "train_batch_size": 32, "trial_name": null, "trial_params": null }