|
{ |
|
"best_metric": 0.7295733911785972, |
|
"best_model_checkpoint": "Ernie-3.0-large-chinese-finetuned-ner/checkpoint-9072", |
|
"epoch": 36.0, |
|
"eval_steps": 500, |
|
"global_step": 9072, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 1.9600000000000002e-05, |
|
"loss": 0.7619, |
|
"step": 252 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.8891147174729265, |
|
"eval_f1": 0.5908584169453734, |
|
"eval_loss": 0.371647447347641, |
|
"eval_precision": 0.5302120848339336, |
|
"eval_recall": 0.6671701913393756, |
|
"eval_runtime": 30.5213, |
|
"eval_samples_per_second": 16.48, |
|
"eval_steps_per_second": 2.064, |
|
"step": 252 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 1.9200000000000003e-05, |
|
"loss": 0.3277, |
|
"step": 504 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.9043503894250163, |
|
"eval_f1": 0.6514158800666296, |
|
"eval_loss": 0.31230422854423523, |
|
"eval_precision": 0.5827538247566064, |
|
"eval_recall": 0.7384189325276939, |
|
"eval_runtime": 30.3199, |
|
"eval_samples_per_second": 16.59, |
|
"eval_steps_per_second": 2.078, |
|
"step": 504 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"learning_rate": 1.88e-05, |
|
"loss": 0.2539, |
|
"step": 756 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.9070344741986534, |
|
"eval_f1": 0.6798141221806642, |
|
"eval_loss": 0.3259331285953522, |
|
"eval_precision": 0.6182230467944754, |
|
"eval_recall": 0.7550352467270897, |
|
"eval_runtime": 31.8667, |
|
"eval_samples_per_second": 15.785, |
|
"eval_steps_per_second": 1.977, |
|
"step": 756 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"learning_rate": 1.8400000000000003e-05, |
|
"loss": 0.209, |
|
"step": 1008 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.899121854345735, |
|
"eval_f1": 0.6714031971580817, |
|
"eval_loss": 0.3699039816856384, |
|
"eval_precision": 0.6004765687053217, |
|
"eval_recall": 0.7613293051359517, |
|
"eval_runtime": 29.8895, |
|
"eval_samples_per_second": 16.829, |
|
"eval_steps_per_second": 2.108, |
|
"step": 1008 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"learning_rate": 1.8e-05, |
|
"loss": 0.1696, |
|
"step": 1260 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.9081980947652589, |
|
"eval_f1": 0.7022252810277587, |
|
"eval_loss": 0.35198503732681274, |
|
"eval_precision": 0.6449641803624104, |
|
"eval_recall": 0.7706445115810675, |
|
"eval_runtime": 31.5563, |
|
"eval_samples_per_second": 15.94, |
|
"eval_steps_per_second": 1.996, |
|
"step": 1260 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"learning_rate": 1.76e-05, |
|
"loss": 0.1394, |
|
"step": 1512 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.9099047382629473, |
|
"eval_f1": 0.6968929804372841, |
|
"eval_loss": 0.36153343319892883, |
|
"eval_precision": 0.6417973717676981, |
|
"eval_recall": 0.7623363544813696, |
|
"eval_runtime": 30.5397, |
|
"eval_samples_per_second": 16.47, |
|
"eval_steps_per_second": 2.063, |
|
"step": 1512 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"learning_rate": 1.72e-05, |
|
"loss": 0.1184, |
|
"step": 1764 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.9082911844105874, |
|
"eval_f1": 0.7067113318701628, |
|
"eval_loss": 0.37900495529174805, |
|
"eval_precision": 0.6529348986125934, |
|
"eval_recall": 0.7701409869083585, |
|
"eval_runtime": 30.8222, |
|
"eval_samples_per_second": 16.319, |
|
"eval_steps_per_second": 2.044, |
|
"step": 1764 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"learning_rate": 1.6800000000000002e-05, |
|
"loss": 0.1011, |
|
"step": 2016 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.9137214137214137, |
|
"eval_f1": 0.7153439153439154, |
|
"eval_loss": 0.38163959980010986, |
|
"eval_precision": 0.671078755790867, |
|
"eval_recall": 0.7658610271903323, |
|
"eval_runtime": 30.6484, |
|
"eval_samples_per_second": 16.412, |
|
"eval_steps_per_second": 2.056, |
|
"step": 2016 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"learning_rate": 1.64e-05, |
|
"loss": 0.0853, |
|
"step": 2268 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.9104477611940298, |
|
"eval_f1": 0.7113811638233232, |
|
"eval_loss": 0.4221731722354889, |
|
"eval_precision": 0.6637592673353685, |
|
"eval_recall": 0.7663645518630413, |
|
"eval_runtime": 29.8305, |
|
"eval_samples_per_second": 16.862, |
|
"eval_steps_per_second": 2.112, |
|
"step": 2268 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"learning_rate": 1.6000000000000003e-05, |
|
"loss": 0.0726, |
|
"step": 2520 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.9108201197753436, |
|
"eval_f1": 0.7088488276187108, |
|
"eval_loss": 0.45063257217407227, |
|
"eval_precision": 0.6662236987818383, |
|
"eval_recall": 0.75730110775428, |
|
"eval_runtime": 31.119, |
|
"eval_samples_per_second": 16.164, |
|
"eval_steps_per_second": 2.024, |
|
"step": 2520 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"learning_rate": 1.5600000000000003e-05, |
|
"loss": 0.0625, |
|
"step": 2772 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_accuracy": 0.9118596208148447, |
|
"eval_f1": 0.7197667638483967, |
|
"eval_loss": 0.465919554233551, |
|
"eval_precision": 0.6704323267434282, |
|
"eval_recall": 0.7769385699899295, |
|
"eval_runtime": 30.3792, |
|
"eval_samples_per_second": 16.557, |
|
"eval_steps_per_second": 2.074, |
|
"step": 2772 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"learning_rate": 1.5200000000000002e-05, |
|
"loss": 0.0554, |
|
"step": 3024 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_accuracy": 0.9138920780711826, |
|
"eval_f1": 0.7228513529622126, |
|
"eval_loss": 0.4619043469429016, |
|
"eval_precision": 0.6864387593389178, |
|
"eval_recall": 0.7633434038267876, |
|
"eval_runtime": 32.0505, |
|
"eval_samples_per_second": 15.694, |
|
"eval_steps_per_second": 1.966, |
|
"step": 3024 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"learning_rate": 1.48e-05, |
|
"loss": 0.0468, |
|
"step": 3276 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_accuracy": 0.9101840071989326, |
|
"eval_f1": 0.7200470311581422, |
|
"eval_loss": 0.5248007774353027, |
|
"eval_precision": 0.6754908449150673, |
|
"eval_recall": 0.770896273917422, |
|
"eval_runtime": 30.3642, |
|
"eval_samples_per_second": 16.566, |
|
"eval_steps_per_second": 2.075, |
|
"step": 3276 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"learning_rate": 1.4400000000000001e-05, |
|
"loss": 0.0416, |
|
"step": 3528 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_accuracy": 0.9106649703664629, |
|
"eval_f1": 0.7144713526284701, |
|
"eval_loss": 0.5338897109031677, |
|
"eval_precision": 0.6730469619407968, |
|
"eval_recall": 0.7613293051359517, |
|
"eval_runtime": 30.627, |
|
"eval_samples_per_second": 16.423, |
|
"eval_steps_per_second": 2.057, |
|
"step": 3528 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"learning_rate": 1.4e-05, |
|
"loss": 0.0349, |
|
"step": 3780 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_accuracy": 0.9078877959474975, |
|
"eval_f1": 0.71319108805847, |
|
"eval_loss": 0.5588390827178955, |
|
"eval_precision": 0.6705830192861894, |
|
"eval_recall": 0.7615810674723061, |
|
"eval_runtime": 30.9024, |
|
"eval_samples_per_second": 16.277, |
|
"eval_steps_per_second": 2.039, |
|
"step": 3780 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"learning_rate": 1.3600000000000002e-05, |
|
"loss": 0.0301, |
|
"step": 4032 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_accuracy": 0.9083687591150278, |
|
"eval_f1": 0.7168475696083058, |
|
"eval_loss": 0.5909355878829956, |
|
"eval_precision": 0.6745115452930728, |
|
"eval_recall": 0.7648539778449144, |
|
"eval_runtime": 31.5608, |
|
"eval_samples_per_second": 15.938, |
|
"eval_steps_per_second": 1.996, |
|
"step": 4032 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"learning_rate": 1.3200000000000002e-05, |
|
"loss": 0.0293, |
|
"step": 4284 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_accuracy": 0.9139075930120706, |
|
"eval_f1": 0.7264906201457759, |
|
"eval_loss": 0.557870090007782, |
|
"eval_precision": 0.6913804866954741, |
|
"eval_recall": 0.7653575025176234, |
|
"eval_runtime": 31.1498, |
|
"eval_samples_per_second": 16.148, |
|
"eval_steps_per_second": 2.022, |
|
"step": 4284 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"learning_rate": 1.2800000000000001e-05, |
|
"loss": 0.0264, |
|
"step": 4536 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_accuracy": 0.9099047382629473, |
|
"eval_f1": 0.7172199665631717, |
|
"eval_loss": 0.5989866256713867, |
|
"eval_precision": 0.682189913675602, |
|
"eval_recall": 0.7560422960725075, |
|
"eval_runtime": 29.8647, |
|
"eval_samples_per_second": 16.843, |
|
"eval_steps_per_second": 2.11, |
|
"step": 4536 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"learning_rate": 1.2400000000000002e-05, |
|
"loss": 0.0223, |
|
"step": 4788 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_accuracy": 0.9099357681447233, |
|
"eval_f1": 0.718458082062197, |
|
"eval_loss": 0.6070677638053894, |
|
"eval_precision": 0.6773690078037904, |
|
"eval_recall": 0.7648539778449144, |
|
"eval_runtime": 30.5876, |
|
"eval_samples_per_second": 16.445, |
|
"eval_steps_per_second": 2.06, |
|
"step": 4788 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"learning_rate": 1.2e-05, |
|
"loss": 0.0195, |
|
"step": 5040 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_accuracy": 0.9119992552828373, |
|
"eval_f1": 0.720656439529076, |
|
"eval_loss": 0.6215817928314209, |
|
"eval_precision": 0.68289384719405, |
|
"eval_recall": 0.7628398791540786, |
|
"eval_runtime": 30.3859, |
|
"eval_samples_per_second": 16.554, |
|
"eval_steps_per_second": 2.073, |
|
"step": 5040 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"learning_rate": 1.16e-05, |
|
"loss": 0.0181, |
|
"step": 5292 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_accuracy": 0.9089428119278865, |
|
"eval_f1": 0.7139341380522678, |
|
"eval_loss": 0.6391084790229797, |
|
"eval_precision": 0.6678360008770007, |
|
"eval_recall": 0.7668680765357503, |
|
"eval_runtime": 31.753, |
|
"eval_samples_per_second": 15.841, |
|
"eval_steps_per_second": 1.984, |
|
"step": 5292 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"learning_rate": 1.1200000000000001e-05, |
|
"loss": 0.016, |
|
"step": 5544 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_accuracy": 0.9129766965587861, |
|
"eval_f1": 0.7200477326968974, |
|
"eval_loss": 0.6382994055747986, |
|
"eval_precision": 0.684437386569873, |
|
"eval_recall": 0.7595669687814703, |
|
"eval_runtime": 30.7224, |
|
"eval_samples_per_second": 16.372, |
|
"eval_steps_per_second": 2.051, |
|
"step": 5544 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"learning_rate": 1.0800000000000002e-05, |
|
"loss": 0.0153, |
|
"step": 5796 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_accuracy": 0.9136903838396375, |
|
"eval_f1": 0.7225759942328487, |
|
"eval_loss": 0.6503807902336121, |
|
"eval_precision": 0.6911054929901173, |
|
"eval_recall": 0.7570493454179255, |
|
"eval_runtime": 30.4671, |
|
"eval_samples_per_second": 16.51, |
|
"eval_steps_per_second": 2.068, |
|
"step": 5796 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"learning_rate": 1.04e-05, |
|
"loss": 0.0135, |
|
"step": 6048 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_accuracy": 0.911083873770441, |
|
"eval_f1": 0.7179244165383247, |
|
"eval_loss": 0.6738658547401428, |
|
"eval_precision": 0.6780040277466994, |
|
"eval_recall": 0.7628398791540786, |
|
"eval_runtime": 31.8247, |
|
"eval_samples_per_second": 15.805, |
|
"eval_steps_per_second": 1.98, |
|
"step": 6048 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"learning_rate": 1e-05, |
|
"loss": 0.0103, |
|
"step": 6300 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_accuracy": 0.9127284575045769, |
|
"eval_f1": 0.7242580800192239, |
|
"eval_loss": 0.677778422832489, |
|
"eval_precision": 0.6927143185474604, |
|
"eval_recall": 0.7588116817724069, |
|
"eval_runtime": 31.5342, |
|
"eval_samples_per_second": 15.951, |
|
"eval_steps_per_second": 1.998, |
|
"step": 6300 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"learning_rate": 9.600000000000001e-06, |
|
"loss": 0.0109, |
|
"step": 6552 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_accuracy": 0.9117665311695162, |
|
"eval_f1": 0.7213822894168466, |
|
"eval_loss": 0.6734189987182617, |
|
"eval_precision": 0.6891334250343879, |
|
"eval_recall": 0.756797583081571, |
|
"eval_runtime": 30.9002, |
|
"eval_samples_per_second": 16.278, |
|
"eval_steps_per_second": 2.039, |
|
"step": 6552 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"learning_rate": 9.200000000000002e-06, |
|
"loss": 0.0097, |
|
"step": 6804 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_accuracy": 0.9124647035094796, |
|
"eval_f1": 0.7231973434535104, |
|
"eval_loss": 0.6837841272354126, |
|
"eval_precision": 0.6836322869955157, |
|
"eval_recall": 0.7676233635448136, |
|
"eval_runtime": 30.4438, |
|
"eval_samples_per_second": 16.522, |
|
"eval_steps_per_second": 2.069, |
|
"step": 6804 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"learning_rate": 8.8e-06, |
|
"loss": 0.0092, |
|
"step": 7056 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_accuracy": 0.9118130759921804, |
|
"eval_f1": 0.7228887320630439, |
|
"eval_loss": 0.7063636183738708, |
|
"eval_precision": 0.6783664459161148, |
|
"eval_recall": 0.7736656596173213, |
|
"eval_runtime": 32.0989, |
|
"eval_samples_per_second": 15.67, |
|
"eval_steps_per_second": 1.963, |
|
"step": 7056 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"learning_rate": 8.400000000000001e-06, |
|
"loss": 0.0079, |
|
"step": 7308 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_accuracy": 0.9113941725882024, |
|
"eval_f1": 0.7218511450381679, |
|
"eval_loss": 0.6944219470024109, |
|
"eval_precision": 0.685856754306437, |
|
"eval_recall": 0.7618328298086606, |
|
"eval_runtime": 31.0056, |
|
"eval_samples_per_second": 16.223, |
|
"eval_steps_per_second": 2.032, |
|
"step": 7308 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"learning_rate": 8.000000000000001e-06, |
|
"loss": 0.0078, |
|
"step": 7560 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_accuracy": 0.9092220808638719, |
|
"eval_f1": 0.717688679245283, |
|
"eval_loss": 0.7390450835227966, |
|
"eval_precision": 0.6750221827861579, |
|
"eval_recall": 0.7661127895266868, |
|
"eval_runtime": 32.0929, |
|
"eval_samples_per_second": 15.673, |
|
"eval_steps_per_second": 1.963, |
|
"step": 7560 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"learning_rate": 7.600000000000001e-06, |
|
"loss": 0.0066, |
|
"step": 7812 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_accuracy": 0.9112235082384336, |
|
"eval_f1": 0.7232323232323231, |
|
"eval_loss": 0.7528515458106995, |
|
"eval_precision": 0.6848975917173081, |
|
"eval_recall": 0.7661127895266868, |
|
"eval_runtime": 31.1215, |
|
"eval_samples_per_second": 16.162, |
|
"eval_steps_per_second": 2.024, |
|
"step": 7812 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"learning_rate": 7.2000000000000005e-06, |
|
"loss": 0.0061, |
|
"step": 8064 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_accuracy": 0.9128680919725696, |
|
"eval_f1": 0.7292161520190024, |
|
"eval_loss": 0.7525067925453186, |
|
"eval_precision": 0.6901978417266187, |
|
"eval_recall": 0.7729103726082578, |
|
"eval_runtime": 30.5355, |
|
"eval_samples_per_second": 16.473, |
|
"eval_steps_per_second": 2.063, |
|
"step": 8064 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"learning_rate": 6.800000000000001e-06, |
|
"loss": 0.005, |
|
"step": 8316 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_accuracy": 0.9131939057312192, |
|
"eval_f1": 0.7289473684210527, |
|
"eval_loss": 0.7354016304016113, |
|
"eval_precision": 0.6943938012762079, |
|
"eval_recall": 0.7671198388721048, |
|
"eval_runtime": 30.6675, |
|
"eval_samples_per_second": 16.402, |
|
"eval_steps_per_second": 2.054, |
|
"step": 8316 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"learning_rate": 6.4000000000000006e-06, |
|
"loss": 0.0059, |
|
"step": 8568 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_accuracy": 0.9108666645980079, |
|
"eval_f1": 0.723687336659539, |
|
"eval_loss": 0.7652931809425354, |
|
"eval_precision": 0.6851102114260009, |
|
"eval_recall": 0.7668680765357503, |
|
"eval_runtime": 31.9436, |
|
"eval_samples_per_second": 15.747, |
|
"eval_steps_per_second": 1.972, |
|
"step": 8568 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"learning_rate": 6e-06, |
|
"loss": 0.0047, |
|
"step": 8820 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_accuracy": 0.9116113817606355, |
|
"eval_f1": 0.7277705035114866, |
|
"eval_loss": 0.7705232501029968, |
|
"eval_precision": 0.6902235267554753, |
|
"eval_recall": 0.7696374622356495, |
|
"eval_runtime": 30.572, |
|
"eval_samples_per_second": 16.453, |
|
"eval_steps_per_second": 2.061, |
|
"step": 8820 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"learning_rate": 5.600000000000001e-06, |
|
"loss": 0.0049, |
|
"step": 9072 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_accuracy": 0.9124336736277034, |
|
"eval_f1": 0.7295733911785972, |
|
"eval_loss": 0.7525166273117065, |
|
"eval_precision": 0.6997226074895978, |
|
"eval_recall": 0.7620845921450151, |
|
"eval_runtime": 30.7353, |
|
"eval_samples_per_second": 16.366, |
|
"eval_steps_per_second": 2.05, |
|
"step": 9072 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 12600, |
|
"num_train_epochs": 50, |
|
"save_steps": 500, |
|
"total_flos": 3.469062692905536e+16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|