Md Mushfiqur Rahman
Upload with huggingface_hub
560f5a7
{
"best_metric": 0.8868703550784476,
"best_model_checkpoint": "/scratch/mrahma45/pixel/finetuned_models/mbert/mbert-base-finetuned-masakhaner-ibo/checkpoint-3000",
"epoch": 74.28571428571429,
"global_step": 5200,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 2.86,
"eval_accuracy_score": 0.9765228426395939,
"eval_f1": 0.8673300165837479,
"eval_loss": 0.08876766264438629,
"eval_precision": 0.863036303630363,
"eval_recall": 0.8716666666666667,
"eval_runtime": 4.4473,
"eval_samples_per_second": 71.954,
"eval_steps_per_second": 8.994,
"step": 200
},
{
"epoch": 5.71,
"eval_accuracy_score": 0.9741434010152284,
"eval_f1": 0.8617886178861788,
"eval_loss": 0.11480691283941269,
"eval_precision": 0.8412698412698413,
"eval_recall": 0.8833333333333333,
"eval_runtime": 4.4462,
"eval_samples_per_second": 71.972,
"eval_steps_per_second": 8.997,
"step": 400
},
{
"epoch": 7.14,
"learning_rate": 4.865771812080537e-05,
"loss": 0.1451,
"step": 500
},
{
"epoch": 8.57,
"eval_accuracy_score": 0.9781091370558376,
"eval_f1": 0.874074074074074,
"eval_loss": 0.10442519187927246,
"eval_precision": 0.8634146341463415,
"eval_recall": 0.885,
"eval_runtime": 4.449,
"eval_samples_per_second": 71.926,
"eval_steps_per_second": 8.991,
"step": 600
},
{
"epoch": 11.43,
"eval_accuracy_score": 0.9766814720812182,
"eval_f1": 0.8705688375927452,
"eval_loss": 0.11804218590259552,
"eval_precision": 0.8613376835236541,
"eval_recall": 0.88,
"eval_runtime": 4.4511,
"eval_samples_per_second": 71.893,
"eval_steps_per_second": 8.987,
"step": 800
},
{
"epoch": 14.29,
"learning_rate": 4.697986577181208e-05,
"loss": 0.0084,
"step": 1000
},
{
"epoch": 14.29,
"eval_accuracy_score": 0.9746192893401016,
"eval_f1": 0.8457047539616346,
"eval_loss": 0.1311611831188202,
"eval_precision": 0.8464106844741235,
"eval_recall": 0.845,
"eval_runtime": 4.4345,
"eval_samples_per_second": 72.162,
"eval_steps_per_second": 9.02,
"step": 1000
},
{
"epoch": 17.14,
"eval_accuracy_score": 0.9763642131979695,
"eval_f1": 0.8714168714168715,
"eval_loss": 0.134602889418602,
"eval_precision": 0.856682769726248,
"eval_recall": 0.8866666666666667,
"eval_runtime": 4.4493,
"eval_samples_per_second": 71.921,
"eval_steps_per_second": 8.99,
"step": 1200
},
{
"epoch": 20.0,
"eval_accuracy_score": 0.9803299492385786,
"eval_f1": 0.8872180451127819,
"eval_loss": 0.1307426393032074,
"eval_precision": 0.8894472361809045,
"eval_recall": 0.885,
"eval_runtime": 4.442,
"eval_samples_per_second": 72.039,
"eval_steps_per_second": 9.005,
"step": 1400
},
{
"epoch": 21.43,
"learning_rate": 4.530201342281879e-05,
"loss": 0.005,
"step": 1500
},
{
"epoch": 22.86,
"eval_accuracy_score": 0.9771573604060914,
"eval_f1": 0.8767576509511993,
"eval_loss": 0.14564308524131775,
"eval_precision": 0.8702791461412152,
"eval_recall": 0.8833333333333333,
"eval_runtime": 4.4473,
"eval_samples_per_second": 71.954,
"eval_steps_per_second": 8.994,
"step": 1600
},
{
"epoch": 25.71,
"eval_accuracy_score": 0.9771573604060914,
"eval_f1": 0.8782104391052196,
"eval_loss": 0.13427743315696716,
"eval_precision": 0.8731466227347611,
"eval_recall": 0.8833333333333333,
"eval_runtime": 4.443,
"eval_samples_per_second": 72.023,
"eval_steps_per_second": 9.003,
"step": 1800
},
{
"epoch": 28.57,
"learning_rate": 4.36241610738255e-05,
"loss": 0.0039,
"step": 2000
},
{
"epoch": 28.57,
"eval_accuracy_score": 0.9762055837563451,
"eval_f1": 0.8687707641196013,
"eval_loss": 0.15129442512989044,
"eval_precision": 0.8658940397350994,
"eval_recall": 0.8716666666666667,
"eval_runtime": 4.4359,
"eval_samples_per_second": 72.139,
"eval_steps_per_second": 9.017,
"step": 2000
},
{
"epoch": 31.43,
"eval_accuracy_score": 0.9750951776649747,
"eval_f1": 0.8700754400670577,
"eval_loss": 0.16774575412273407,
"eval_precision": 0.8752107925801011,
"eval_recall": 0.865,
"eval_runtime": 4.4409,
"eval_samples_per_second": 72.057,
"eval_steps_per_second": 9.007,
"step": 2200
},
{
"epoch": 34.29,
"eval_accuracy_score": 0.9749365482233503,
"eval_f1": 0.8601973684210527,
"eval_loss": 0.1633668839931488,
"eval_precision": 0.849025974025974,
"eval_recall": 0.8716666666666667,
"eval_runtime": 4.4452,
"eval_samples_per_second": 71.988,
"eval_steps_per_second": 8.998,
"step": 2400
},
{
"epoch": 35.71,
"learning_rate": 4.194630872483222e-05,
"loss": 0.0036,
"step": 2500
},
{
"epoch": 37.14,
"eval_accuracy_score": 0.9766814720812182,
"eval_f1": 0.8782104391052196,
"eval_loss": 0.16212213039398193,
"eval_precision": 0.8731466227347611,
"eval_recall": 0.8833333333333333,
"eval_runtime": 4.4427,
"eval_samples_per_second": 72.028,
"eval_steps_per_second": 9.004,
"step": 2600
},
{
"epoch": 40.0,
"eval_accuracy_score": 0.9763642131979695,
"eval_f1": 0.8719665271966527,
"eval_loss": 0.16754868626594543,
"eval_precision": 0.8756302521008403,
"eval_recall": 0.8683333333333333,
"eval_runtime": 4.4401,
"eval_samples_per_second": 72.07,
"eval_steps_per_second": 9.009,
"step": 2800
},
{
"epoch": 42.86,
"learning_rate": 4.026845637583892e-05,
"loss": 0.0023,
"step": 3000
},
{
"epoch": 42.86,
"eval_accuracy_score": 0.9790609137055838,
"eval_f1": 0.8868703550784476,
"eval_loss": 0.14278778433799744,
"eval_precision": 0.8788870703764321,
"eval_recall": 0.895,
"eval_runtime": 4.4323,
"eval_samples_per_second": 72.197,
"eval_steps_per_second": 9.025,
"step": 3000
},
{
"epoch": 45.71,
"eval_accuracy_score": 0.9782677664974619,
"eval_f1": 0.8855721393034827,
"eval_loss": 0.14296667277812958,
"eval_precision": 0.8811881188118812,
"eval_recall": 0.89,
"eval_runtime": 4.4374,
"eval_samples_per_second": 72.114,
"eval_steps_per_second": 9.014,
"step": 3200
},
{
"epoch": 48.57,
"eval_accuracy_score": 0.9781091370558376,
"eval_f1": 0.8870703764320785,
"eval_loss": 0.14033867418766022,
"eval_precision": 0.8713826366559485,
"eval_recall": 0.9033333333333333,
"eval_runtime": 4.4359,
"eval_samples_per_second": 72.138,
"eval_steps_per_second": 9.017,
"step": 3400
},
{
"epoch": 50.0,
"learning_rate": 3.859060402684564e-05,
"loss": 0.0026,
"step": 3500
},
{
"epoch": 51.43,
"eval_accuracy_score": 0.9749365482233503,
"eval_f1": 0.8693467336683417,
"eval_loss": 0.18670859932899475,
"eval_precision": 0.8737373737373737,
"eval_recall": 0.865,
"eval_runtime": 4.4362,
"eval_samples_per_second": 72.133,
"eval_steps_per_second": 9.017,
"step": 3600
},
{
"epoch": 54.29,
"eval_accuracy_score": 0.9803299492385786,
"eval_f1": 0.8937908496732027,
"eval_loss": 0.1545487940311432,
"eval_precision": 0.8766025641025641,
"eval_recall": 0.9116666666666666,
"eval_runtime": 4.4428,
"eval_samples_per_second": 72.027,
"eval_steps_per_second": 9.003,
"step": 3800
},
{
"epoch": 57.14,
"learning_rate": 3.6912751677852356e-05,
"loss": 0.0021,
"step": 4000
},
{
"epoch": 57.14,
"eval_accuracy_score": 0.975253807106599,
"eval_f1": 0.8647302904564315,
"eval_loss": 0.1578870564699173,
"eval_precision": 0.8611570247933884,
"eval_recall": 0.8683333333333333,
"eval_runtime": 4.4357,
"eval_samples_per_second": 72.143,
"eval_steps_per_second": 9.018,
"step": 4000
},
{
"epoch": 60.0,
"eval_accuracy_score": 0.9792195431472082,
"eval_f1": 0.8872305140961857,
"eval_loss": 0.14871039986610413,
"eval_precision": 0.8828382838283828,
"eval_recall": 0.8916666666666667,
"eval_runtime": 4.4317,
"eval_samples_per_second": 72.207,
"eval_steps_per_second": 9.026,
"step": 4200
},
{
"epoch": 62.86,
"eval_accuracy_score": 0.9758883248730964,
"eval_f1": 0.865546218487395,
"eval_loss": 0.16632404923439026,
"eval_precision": 0.8728813559322034,
"eval_recall": 0.8583333333333333,
"eval_runtime": 4.4414,
"eval_samples_per_second": 72.05,
"eval_steps_per_second": 9.006,
"step": 4400
},
{
"epoch": 64.29,
"learning_rate": 3.523489932885906e-05,
"loss": 0.0026,
"step": 4500
},
{
"epoch": 65.71,
"eval_accuracy_score": 0.9747779187817259,
"eval_f1": 0.865721434528774,
"eval_loss": 0.15900883078575134,
"eval_precision": 0.8664440734557596,
"eval_recall": 0.865,
"eval_runtime": 4.441,
"eval_samples_per_second": 72.055,
"eval_steps_per_second": 9.007,
"step": 4600
},
{
"epoch": 68.57,
"eval_accuracy_score": 0.9789022842639594,
"eval_f1": 0.8827470686767169,
"eval_loss": 0.16089987754821777,
"eval_precision": 0.8872053872053872,
"eval_recall": 0.8783333333333333,
"eval_runtime": 4.4442,
"eval_samples_per_second": 72.004,
"eval_steps_per_second": 9.001,
"step": 4800
},
{
"epoch": 71.43,
"learning_rate": 3.3557046979865775e-05,
"loss": 0.0017,
"step": 5000
},
{
"epoch": 71.43,
"eval_accuracy_score": 0.9750951776649747,
"eval_f1": 0.8611339359079703,
"eval_loss": 0.1948554664850235,
"eval_precision": 0.8492706645056726,
"eval_recall": 0.8733333333333333,
"eval_runtime": 12.3435,
"eval_samples_per_second": 25.925,
"eval_steps_per_second": 3.241,
"step": 5000
},
{
"epoch": 74.29,
"eval_accuracy_score": 0.9777918781725888,
"eval_f1": 0.886158886158886,
"eval_loss": 0.15537256002426147,
"eval_precision": 0.8711755233494364,
"eval_recall": 0.9016666666666666,
"eval_runtime": 4.4385,
"eval_samples_per_second": 72.096,
"eval_steps_per_second": 9.012,
"step": 5200
},
{
"epoch": 74.29,
"step": 5200,
"total_flos": 2.169292304429568e+16,
"train_loss": 0.01710937021443477,
"train_runtime": 8154.5313,
"train_samples_per_second": 58.863,
"train_steps_per_second": 1.839
}
],
"max_steps": 15000,
"num_train_epochs": 215,
"total_flos": 2.169292304429568e+16,
"trial_name": null,
"trial_params": null
}