|
{ |
|
"best_metric": 0.7894736842105264, |
|
"best_model_checkpoint": "outputs/xlm-roberta-base-twitter-indonesia-sarcastic/checkpoint-590", |
|
"epoch": 13.0, |
|
"eval_steps": 500, |
|
"global_step": 767, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 9.997697221833061e-06, |
|
"loss": 0.5641, |
|
"step": 59 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.75, |
|
"eval_f1": 0.0, |
|
"eval_loss": 0.5259643793106079, |
|
"eval_precision": 0.0, |
|
"eval_recall": 0.0, |
|
"eval_runtime": 1.0571, |
|
"eval_samples_per_second": 253.522, |
|
"eval_steps_per_second": 4.73, |
|
"step": 59 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 9.990465155165683e-06, |
|
"loss": 0.5317, |
|
"step": 118 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.75, |
|
"eval_f1": 0.0, |
|
"eval_loss": 0.5029988288879395, |
|
"eval_precision": 0.0, |
|
"eval_recall": 0.0, |
|
"eval_runtime": 1.053, |
|
"eval_samples_per_second": 254.519, |
|
"eval_steps_per_second": 4.748, |
|
"step": 118 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"learning_rate": 9.978555124138569e-06, |
|
"loss": 0.4995, |
|
"step": 177 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.75, |
|
"eval_f1": 0.0, |
|
"eval_loss": 0.4655507504940033, |
|
"eval_precision": 0.0, |
|
"eval_recall": 0.0, |
|
"eval_runtime": 1.0523, |
|
"eval_samples_per_second": 254.669, |
|
"eval_steps_per_second": 4.751, |
|
"step": 177 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"learning_rate": 9.961568226140335e-06, |
|
"loss": 0.4599, |
|
"step": 236 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.7686567164179104, |
|
"eval_f1": 0.6025641025641025, |
|
"eval_loss": 0.4502911865711212, |
|
"eval_precision": 0.5280898876404494, |
|
"eval_recall": 0.7014925373134329, |
|
"eval_runtime": 1.057, |
|
"eval_samples_per_second": 253.552, |
|
"eval_steps_per_second": 4.73, |
|
"step": 236 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"learning_rate": 9.93968485932029e-06, |
|
"loss": 0.4082, |
|
"step": 295 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.8470149253731343, |
|
"eval_f1": 0.6434782608695653, |
|
"eval_loss": 0.378521591424942, |
|
"eval_precision": 0.7708333333333334, |
|
"eval_recall": 0.5522388059701493, |
|
"eval_runtime": 1.0544, |
|
"eval_samples_per_second": 254.183, |
|
"eval_steps_per_second": 4.742, |
|
"step": 295 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"learning_rate": 9.912926619919478e-06, |
|
"loss": 0.3274, |
|
"step": 354 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.8619402985074627, |
|
"eval_f1": 0.6991869918699187, |
|
"eval_loss": 0.3604646623134613, |
|
"eval_precision": 0.7678571428571429, |
|
"eval_recall": 0.6417910447761194, |
|
"eval_runtime": 1.0555, |
|
"eval_samples_per_second": 253.908, |
|
"eval_steps_per_second": 4.737, |
|
"step": 354 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"learning_rate": 9.881895849126432e-06, |
|
"loss": 0.2621, |
|
"step": 413 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.8619402985074627, |
|
"eval_f1": 0.6837606837606838, |
|
"eval_loss": 0.3764938712120056, |
|
"eval_precision": 0.8, |
|
"eval_recall": 0.5970149253731343, |
|
"eval_runtime": 1.0562, |
|
"eval_samples_per_second": 253.732, |
|
"eval_steps_per_second": 4.734, |
|
"step": 413 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"learning_rate": 9.845553233485602e-06, |
|
"loss": 0.2332, |
|
"step": 472 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.8768656716417911, |
|
"eval_f1": 0.759124087591241, |
|
"eval_loss": 0.34082189202308655, |
|
"eval_precision": 0.7428571428571429, |
|
"eval_recall": 0.7761194029850746, |
|
"eval_runtime": 1.0525, |
|
"eval_samples_per_second": 254.642, |
|
"eval_steps_per_second": 4.751, |
|
"step": 472 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"learning_rate": 9.804428641814051e-06, |
|
"loss": 0.1579, |
|
"step": 531 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.8731343283582089, |
|
"eval_f1": 0.7213114754098361, |
|
"eval_loss": 0.43820273876190186, |
|
"eval_precision": 0.8, |
|
"eval_recall": 0.6567164179104478, |
|
"eval_runtime": 1.055, |
|
"eval_samples_per_second": 254.04, |
|
"eval_steps_per_second": 4.74, |
|
"step": 531 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"learning_rate": 9.75856265911873e-06, |
|
"loss": 0.1467, |
|
"step": 590 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.8805970149253731, |
|
"eval_f1": 0.7894736842105264, |
|
"eval_loss": 0.38548171520233154, |
|
"eval_precision": 0.7058823529411765, |
|
"eval_recall": 0.8955223880597015, |
|
"eval_runtime": 1.053, |
|
"eval_samples_per_second": 254.501, |
|
"eval_steps_per_second": 4.748, |
|
"step": 590 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"learning_rate": 9.708000549587091e-06, |
|
"loss": 0.098, |
|
"step": 649 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_accuracy": 0.8805970149253731, |
|
"eval_f1": 0.7500000000000001, |
|
"eval_loss": 0.46932676434516907, |
|
"eval_precision": 0.7868852459016393, |
|
"eval_recall": 0.7164179104477612, |
|
"eval_runtime": 1.058, |
|
"eval_samples_per_second": 253.305, |
|
"eval_steps_per_second": 4.726, |
|
"step": 649 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"learning_rate": 9.653766360237254e-06, |
|
"loss": 0.0929, |
|
"step": 708 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_accuracy": 0.8805970149253731, |
|
"eval_f1": 0.7333333333333334, |
|
"eval_loss": 0.6206381916999817, |
|
"eval_precision": 0.8301886792452831, |
|
"eval_recall": 0.6567164179104478, |
|
"eval_runtime": 1.0526, |
|
"eval_samples_per_second": 254.603, |
|
"eval_steps_per_second": 4.75, |
|
"step": 708 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"learning_rate": 9.594043625628571e-06, |
|
"loss": 0.0555, |
|
"step": 767 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_accuracy": 0.8843283582089553, |
|
"eval_f1": 0.7633587786259542, |
|
"eval_loss": 0.7134280800819397, |
|
"eval_precision": 0.78125, |
|
"eval_recall": 0.746268656716418, |
|
"eval_runtime": 1.054, |
|
"eval_samples_per_second": 254.279, |
|
"eval_steps_per_second": 4.744, |
|
"step": 767 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"step": 767, |
|
"total_flos": 1605898326389760.0, |
|
"train_loss": 0.2951739639471221, |
|
"train_runtime": 432.0494, |
|
"train_samples_per_second": 434.673, |
|
"train_steps_per_second": 13.656 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 5900, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 100, |
|
"save_steps": 500, |
|
"total_flos": 1605898326389760.0, |
|
"train_batch_size": 32, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|