|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 18.06451612903226, |
|
"global_step": 140, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.9, |
|
"eval_accuracy": 0.7258883248730964, |
|
"eval_f1": 0.0, |
|
"eval_loss": 1.5211623907089233, |
|
"eval_precision": 0.0, |
|
"eval_recall": 0.0, |
|
"eval_runtime": 0.0934, |
|
"eval_samples_per_second": 85.695, |
|
"eval_steps_per_second": 10.712, |
|
"step": 7 |
|
}, |
|
{ |
|
"epoch": 1.94, |
|
"eval_accuracy": 0.7326565143824028, |
|
"eval_f1": 0.0, |
|
"eval_loss": 1.0808664560317993, |
|
"eval_precision": 0.0, |
|
"eval_recall": 0.0, |
|
"eval_runtime": 0.075, |
|
"eval_samples_per_second": 106.603, |
|
"eval_steps_per_second": 13.325, |
|
"step": 15 |
|
}, |
|
{ |
|
"epoch": 2.97, |
|
"eval_accuracy": 0.7681895093062606, |
|
"eval_f1": 0.17142857142857143, |
|
"eval_loss": 0.902431309223175, |
|
"eval_precision": 0.2, |
|
"eval_recall": 0.15, |
|
"eval_runtime": 0.0865, |
|
"eval_samples_per_second": 92.481, |
|
"eval_steps_per_second": 11.56, |
|
"step": 23 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.7969543147208121, |
|
"eval_f1": 0.2518518518518518, |
|
"eval_loss": 0.7922185063362122, |
|
"eval_precision": 0.22666666666666666, |
|
"eval_recall": 0.2833333333333333, |
|
"eval_runtime": 0.0722, |
|
"eval_samples_per_second": 110.797, |
|
"eval_steps_per_second": 13.85, |
|
"step": 31 |
|
}, |
|
{ |
|
"epoch": 4.9, |
|
"eval_accuracy": 0.8155668358714044, |
|
"eval_f1": 0.32876712328767127, |
|
"eval_loss": 0.7233745455741882, |
|
"eval_precision": 0.27906976744186046, |
|
"eval_recall": 0.4, |
|
"eval_runtime": 0.0672, |
|
"eval_samples_per_second": 118.965, |
|
"eval_steps_per_second": 14.871, |
|
"step": 38 |
|
}, |
|
{ |
|
"epoch": 5.94, |
|
"eval_accuracy": 0.8358714043993232, |
|
"eval_f1": 0.4305555555555556, |
|
"eval_loss": 0.6560729146003723, |
|
"eval_precision": 0.36904761904761907, |
|
"eval_recall": 0.5166666666666667, |
|
"eval_runtime": 0.0878, |
|
"eval_samples_per_second": 91.083, |
|
"eval_steps_per_second": 11.385, |
|
"step": 46 |
|
}, |
|
{ |
|
"epoch": 6.97, |
|
"eval_accuracy": 0.8443316412859561, |
|
"eval_f1": 0.4347826086956522, |
|
"eval_loss": 0.626990795135498, |
|
"eval_precision": 0.38461538461538464, |
|
"eval_recall": 0.5, |
|
"eval_runtime": 0.0846, |
|
"eval_samples_per_second": 94.599, |
|
"eval_steps_per_second": 11.825, |
|
"step": 54 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.8494077834179357, |
|
"eval_f1": 0.48951048951048953, |
|
"eval_loss": 0.5750179886817932, |
|
"eval_precision": 0.42168674698795183, |
|
"eval_recall": 0.5833333333333334, |
|
"eval_runtime": 0.0711, |
|
"eval_samples_per_second": 112.546, |
|
"eval_steps_per_second": 14.068, |
|
"step": 62 |
|
}, |
|
{ |
|
"epoch": 8.9, |
|
"eval_accuracy": 0.8595600676818951, |
|
"eval_f1": 0.5109489051094891, |
|
"eval_loss": 0.5483719110488892, |
|
"eval_precision": 0.45454545454545453, |
|
"eval_recall": 0.5833333333333334, |
|
"eval_runtime": 0.104, |
|
"eval_samples_per_second": 76.947, |
|
"eval_steps_per_second": 9.618, |
|
"step": 69 |
|
}, |
|
{ |
|
"epoch": 9.94, |
|
"eval_accuracy": 0.8629441624365483, |
|
"eval_f1": 0.5285714285714286, |
|
"eval_loss": 0.5253370404243469, |
|
"eval_precision": 0.4625, |
|
"eval_recall": 0.6166666666666667, |
|
"eval_runtime": 0.0872, |
|
"eval_samples_per_second": 91.721, |
|
"eval_steps_per_second": 11.465, |
|
"step": 77 |
|
}, |
|
{ |
|
"epoch": 10.97, |
|
"eval_accuracy": 0.868020304568528, |
|
"eval_f1": 0.5179856115107914, |
|
"eval_loss": 0.5097917914390564, |
|
"eval_precision": 0.45569620253164556, |
|
"eval_recall": 0.6, |
|
"eval_runtime": 0.0862, |
|
"eval_samples_per_second": 92.832, |
|
"eval_steps_per_second": 11.604, |
|
"step": 85 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_accuracy": 0.8781725888324873, |
|
"eval_f1": 0.5547445255474452, |
|
"eval_loss": 0.49227389693260193, |
|
"eval_precision": 0.4935064935064935, |
|
"eval_recall": 0.6333333333333333, |
|
"eval_runtime": 0.0683, |
|
"eval_samples_per_second": 117.18, |
|
"eval_steps_per_second": 14.647, |
|
"step": 93 |
|
}, |
|
{ |
|
"epoch": 12.9, |
|
"eval_accuracy": 0.868020304568528, |
|
"eval_f1": 0.5294117647058824, |
|
"eval_loss": 0.49868977069854736, |
|
"eval_precision": 0.47368421052631576, |
|
"eval_recall": 0.6, |
|
"eval_runtime": 0.0863, |
|
"eval_samples_per_second": 92.658, |
|
"eval_steps_per_second": 11.582, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 13.94, |
|
"eval_accuracy": 0.871404399323181, |
|
"eval_f1": 0.5652173913043479, |
|
"eval_loss": 0.5003769397735596, |
|
"eval_precision": 0.5, |
|
"eval_recall": 0.65, |
|
"eval_runtime": 0.0861, |
|
"eval_samples_per_second": 92.934, |
|
"eval_steps_per_second": 11.617, |
|
"step": 108 |
|
}, |
|
{ |
|
"epoch": 14.97, |
|
"eval_accuracy": 0.8815566835871405, |
|
"eval_f1": 0.5588235294117647, |
|
"eval_loss": 0.48066699504852295, |
|
"eval_precision": 0.5, |
|
"eval_recall": 0.6333333333333333, |
|
"eval_runtime": 0.073, |
|
"eval_samples_per_second": 109.637, |
|
"eval_steps_per_second": 13.705, |
|
"step": 116 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_accuracy": 0.8798646362098139, |
|
"eval_f1": 0.5481481481481482, |
|
"eval_loss": 0.48719707131385803, |
|
"eval_precision": 0.49333333333333335, |
|
"eval_recall": 0.6166666666666667, |
|
"eval_runtime": 0.0729, |
|
"eval_samples_per_second": 109.707, |
|
"eval_steps_per_second": 13.713, |
|
"step": 124 |
|
}, |
|
{ |
|
"epoch": 16.9, |
|
"eval_accuracy": 0.8866328257191202, |
|
"eval_f1": 0.6029411764705882, |
|
"eval_loss": 0.48052239418029785, |
|
"eval_precision": 0.5394736842105263, |
|
"eval_recall": 0.6833333333333333, |
|
"eval_runtime": 0.0836, |
|
"eval_samples_per_second": 95.684, |
|
"eval_steps_per_second": 11.96, |
|
"step": 131 |
|
}, |
|
{ |
|
"epoch": 17.94, |
|
"eval_accuracy": 0.8866328257191202, |
|
"eval_f1": 0.5882352941176471, |
|
"eval_loss": 0.48192963004112244, |
|
"eval_precision": 0.5263157894736842, |
|
"eval_recall": 0.6666666666666666, |
|
"eval_runtime": 0.0874, |
|
"eval_samples_per_second": 91.531, |
|
"eval_steps_per_second": 11.441, |
|
"step": 139 |
|
}, |
|
{ |
|
"epoch": 18.06, |
|
"eval_accuracy": 0.8866328257191202, |
|
"eval_f1": 0.5882352941176471, |
|
"eval_loss": 0.48198172450065613, |
|
"eval_precision": 0.5263157894736842, |
|
"eval_recall": 0.6666666666666666, |
|
"eval_runtime": 0.0703, |
|
"eval_samples_per_second": 113.867, |
|
"eval_steps_per_second": 14.233, |
|
"step": 140 |
|
}, |
|
{ |
|
"epoch": 18.06, |
|
"step": 140, |
|
"total_flos": 142825785914880.0, |
|
"train_loss": 0.5361384800502232, |
|
"train_runtime": 994.5385, |
|
"train_samples_per_second": 2.433, |
|
"train_steps_per_second": 0.141 |
|
} |
|
], |
|
"max_steps": 140, |
|
"num_train_epochs": 20, |
|
"total_flos": 142825785914880.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|