|
{ |
|
"best_metric": 0.2427176833152771, |
|
"best_model_checkpoint": "/content/dnrti_securebert/checkpoint-4500", |
|
"epoch": 10.0, |
|
"eval_steps": 500, |
|
"global_step": 6570, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.76, |
|
"learning_rate": 1.8477929984779303e-05, |
|
"loss": 0.7821, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.76, |
|
"eval_accuracy": 0.8744877049180327, |
|
"eval_f1": 0.5547161666306928, |
|
"eval_loss": 0.4215104579925537, |
|
"eval_precision": 0.5219333874898456, |
|
"eval_recall": 0.5918931368033165, |
|
"eval_runtime": 3.0633, |
|
"eval_samples_per_second": 215.778, |
|
"eval_steps_per_second": 27.095, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.52, |
|
"learning_rate": 1.69558599695586e-05, |
|
"loss": 0.3559, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 1.52, |
|
"eval_accuracy": 0.900785519125683, |
|
"eval_f1": 0.6425522354527072, |
|
"eval_loss": 0.31522974371910095, |
|
"eval_precision": 0.6271929824561403, |
|
"eval_recall": 0.6586826347305389, |
|
"eval_runtime": 2.5699, |
|
"eval_samples_per_second": 257.203, |
|
"eval_steps_per_second": 32.296, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 2.28, |
|
"learning_rate": 1.54337899543379e-05, |
|
"loss": 0.2807, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 2.28, |
|
"eval_accuracy": 0.9084130236794171, |
|
"eval_f1": 0.681571521597569, |
|
"eval_loss": 0.29523420333862305, |
|
"eval_precision": 0.6444991789819376, |
|
"eval_recall": 0.7231690465223399, |
|
"eval_runtime": 2.6375, |
|
"eval_samples_per_second": 250.619, |
|
"eval_steps_per_second": 31.47, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 3.04, |
|
"learning_rate": 1.39117199391172e-05, |
|
"loss": 0.2272, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 3.04, |
|
"eval_accuracy": 0.9160974499089253, |
|
"eval_f1": 0.707285342584562, |
|
"eval_loss": 0.2793317437171936, |
|
"eval_precision": 0.6681687832855387, |
|
"eval_recall": 0.7512666973744818, |
|
"eval_runtime": 3.0401, |
|
"eval_samples_per_second": 217.427, |
|
"eval_steps_per_second": 27.302, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 3.81, |
|
"learning_rate": 1.2389649923896501e-05, |
|
"loss": 0.1837, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 3.81, |
|
"eval_accuracy": 0.9258310564663024, |
|
"eval_f1": 0.7333931777378815, |
|
"eval_loss": 0.2489345222711563, |
|
"eval_precision": 0.7150984682713348, |
|
"eval_recall": 0.7526485490557346, |
|
"eval_runtime": 2.5725, |
|
"eval_samples_per_second": 256.952, |
|
"eval_steps_per_second": 32.265, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 4.57, |
|
"learning_rate": 1.08675799086758e-05, |
|
"loss": 0.1497, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 4.57, |
|
"eval_accuracy": 0.9285632969034608, |
|
"eval_f1": 0.7529359627742077, |
|
"eval_loss": 0.25113749504089355, |
|
"eval_precision": 0.7254483347566183, |
|
"eval_recall": 0.7825886688162137, |
|
"eval_runtime": 2.9682, |
|
"eval_samples_per_second": 222.691, |
|
"eval_steps_per_second": 27.963, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 5.33, |
|
"learning_rate": 9.3455098934551e-06, |
|
"loss": 0.1371, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 5.33, |
|
"eval_accuracy": 0.9331170309653917, |
|
"eval_f1": 0.7587294435683712, |
|
"eval_loss": 0.24962495267391205, |
|
"eval_precision": 0.7425044091710759, |
|
"eval_recall": 0.7756794104099494, |
|
"eval_runtime": 2.5966, |
|
"eval_samples_per_second": 254.564, |
|
"eval_steps_per_second": 31.965, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 6.09, |
|
"learning_rate": 7.823439878234399e-06, |
|
"loss": 0.1135, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 6.09, |
|
"eval_accuracy": 0.9325478142076503, |
|
"eval_f1": 0.7661713286713285, |
|
"eval_loss": 0.25536227226257324, |
|
"eval_precision": 0.7288981288981289, |
|
"eval_recall": 0.8074619990787656, |
|
"eval_runtime": 2.5496, |
|
"eval_samples_per_second": 259.252, |
|
"eval_steps_per_second": 32.554, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 6.85, |
|
"learning_rate": 6.301369863013699e-06, |
|
"loss": 0.1018, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 6.85, |
|
"eval_accuracy": 0.9382399817850637, |
|
"eval_f1": 0.7772965580123091, |
|
"eval_loss": 0.2427176833152771, |
|
"eval_precision": 0.769404332129964, |
|
"eval_recall": 0.7853523721787194, |
|
"eval_runtime": 2.5904, |
|
"eval_samples_per_second": 255.175, |
|
"eval_steps_per_second": 32.042, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 7.61, |
|
"learning_rate": 4.779299847792998e-06, |
|
"loss": 0.0899, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 7.61, |
|
"eval_accuracy": 0.9377846083788707, |
|
"eval_f1": 0.7864271457085829, |
|
"eval_loss": 0.2516387104988098, |
|
"eval_precision": 0.7583404619332763, |
|
"eval_recall": 0.8166743436204514, |
|
"eval_runtime": 2.5729, |
|
"eval_samples_per_second": 256.912, |
|
"eval_steps_per_second": 32.26, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 8.37, |
|
"learning_rate": 3.2572298325722984e-06, |
|
"loss": 0.0809, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 8.37, |
|
"eval_accuracy": 0.9405737704918032, |
|
"eval_f1": 0.7940058152538582, |
|
"eval_loss": 0.24588441848754883, |
|
"eval_precision": 0.7717391304347826, |
|
"eval_recall": 0.81759557807462, |
|
"eval_runtime": 2.5675, |
|
"eval_samples_per_second": 257.446, |
|
"eval_steps_per_second": 32.327, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 9.13, |
|
"learning_rate": 1.7351598173515982e-06, |
|
"loss": 0.0763, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 9.13, |
|
"eval_accuracy": 0.9392076502732241, |
|
"eval_f1": 0.7852112676056338, |
|
"eval_loss": 0.2552666962146759, |
|
"eval_precision": 0.7517909818794775, |
|
"eval_recall": 0.8217411331183786, |
|
"eval_runtime": 2.7364, |
|
"eval_samples_per_second": 241.554, |
|
"eval_steps_per_second": 30.331, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 9.89, |
|
"learning_rate": 2.1308980213089802e-07, |
|
"loss": 0.0687, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 9.89, |
|
"eval_accuracy": 0.9406876138433515, |
|
"eval_f1": 0.790150842945874, |
|
"eval_loss": 0.2534164488315582, |
|
"eval_precision": 0.7620881471972615, |
|
"eval_recall": 0.8203592814371258, |
|
"eval_runtime": 3.0206, |
|
"eval_samples_per_second": 218.833, |
|
"eval_steps_per_second": 27.478, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"step": 6570, |
|
"total_flos": 1395895287387240.0, |
|
"train_loss": 0.20224008327931212, |
|
"train_runtime": 907.9488, |
|
"train_samples_per_second": 57.823, |
|
"train_steps_per_second": 7.236 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 6570, |
|
"num_train_epochs": 10, |
|
"save_steps": 500, |
|
"total_flos": 1395895287387240.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|