paul
End of training
351d245
raw
history blame
No virus
37.4 kB
{
"best_metric": 0.8440366972477065,
"best_model_checkpoint": "microsoft-resnet-50-cartoon-emotion-detection/checkpoint-528",
"epoch": 79.96969696969697,
"global_step": 640,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.97,
"eval_accuracy": 0.22935779816513763,
"eval_f1": 0.21647331951741566,
"eval_loss": 1.3854628801345825,
"eval_precision": 0.2697355008315897,
"eval_recall": 0.22935779816513763,
"eval_runtime": 6.0845,
"eval_samples_per_second": 17.914,
"eval_steps_per_second": 0.329,
"step": 8
},
{
"epoch": 1.24,
"learning_rate": 1.8750000000000002e-05,
"loss": 1.4222,
"step": 10
},
{
"epoch": 1.97,
"eval_accuracy": 0.25688073394495414,
"eval_f1": 0.25434987070599063,
"eval_loss": 1.3791918754577637,
"eval_precision": 0.2807708571335123,
"eval_recall": 0.25688073394495414,
"eval_runtime": 4.2925,
"eval_samples_per_second": 25.393,
"eval_steps_per_second": 0.466,
"step": 16
},
{
"epoch": 2.48,
"learning_rate": 3.7500000000000003e-05,
"loss": 1.4183,
"step": 20
},
{
"epoch": 2.97,
"eval_accuracy": 0.3853211009174312,
"eval_f1": 0.3511144563688655,
"eval_loss": 1.3646042346954346,
"eval_precision": 0.4102155235182758,
"eval_recall": 0.3853211009174312,
"eval_runtime": 4.3579,
"eval_samples_per_second": 25.012,
"eval_steps_per_second": 0.459,
"step": 24
},
{
"epoch": 3.73,
"learning_rate": 5.625e-05,
"loss": 1.4097,
"step": 30
},
{
"epoch": 3.97,
"eval_accuracy": 0.41284403669724773,
"eval_f1": 0.32452248836490605,
"eval_loss": 1.3562716245651245,
"eval_precision": 0.5062447369587377,
"eval_recall": 0.41284403669724773,
"eval_runtime": 4.3612,
"eval_samples_per_second": 24.993,
"eval_steps_per_second": 0.459,
"step": 32
},
{
"epoch": 4.97,
"learning_rate": 7.500000000000001e-05,
"loss": 1.3944,
"step": 40
},
{
"epoch": 4.97,
"eval_accuracy": 0.4036697247706422,
"eval_f1": 0.293905028882093,
"eval_loss": 1.3461558818817139,
"eval_precision": 0.3927443217900042,
"eval_recall": 0.4036697247706422,
"eval_runtime": 4.4159,
"eval_samples_per_second": 24.684,
"eval_steps_per_second": 0.453,
"step": 40
},
{
"epoch": 5.97,
"eval_accuracy": 0.4036697247706422,
"eval_f1": 0.2840541721275666,
"eval_loss": 1.322252631187439,
"eval_precision": 0.5152005756431013,
"eval_recall": 0.4036697247706422,
"eval_runtime": 4.2725,
"eval_samples_per_second": 25.512,
"eval_steps_per_second": 0.468,
"step": 48
},
{
"epoch": 6.24,
"learning_rate": 9.375e-05,
"loss": 1.411,
"step": 50
},
{
"epoch": 6.97,
"eval_accuracy": 0.41284403669724773,
"eval_f1": 0.29851761513413444,
"eval_loss": 1.304025411605835,
"eval_precision": 0.44039013993142434,
"eval_recall": 0.41284403669724773,
"eval_runtime": 4.4737,
"eval_samples_per_second": 24.365,
"eval_steps_per_second": 0.447,
"step": 56
},
{
"epoch": 7.48,
"learning_rate": 0.0001125,
"loss": 1.346,
"step": 60
},
{
"epoch": 7.97,
"eval_accuracy": 0.4954128440366973,
"eval_f1": 0.4092687533729088,
"eval_loss": 1.2699785232543945,
"eval_precision": 0.49603902723168775,
"eval_recall": 0.4954128440366973,
"eval_runtime": 4.5079,
"eval_samples_per_second": 24.18,
"eval_steps_per_second": 0.444,
"step": 64
},
{
"epoch": 8.73,
"learning_rate": 0.00011875000000000001,
"loss": 1.3031,
"step": 70
},
{
"epoch": 8.97,
"eval_accuracy": 0.5596330275229358,
"eval_f1": 0.46723852012270245,
"eval_loss": 1.2149937152862549,
"eval_precision": 0.5440134711415631,
"eval_recall": 0.5596330275229358,
"eval_runtime": 4.3712,
"eval_samples_per_second": 24.936,
"eval_steps_per_second": 0.458,
"step": 72
},
{
"epoch": 9.97,
"learning_rate": 0.00011666666666666667,
"loss": 1.2371,
"step": 80
},
{
"epoch": 9.97,
"eval_accuracy": 0.5963302752293578,
"eval_f1": 0.5100508405791544,
"eval_loss": 1.1580270528793335,
"eval_precision": 0.5659333353788879,
"eval_recall": 0.5963302752293578,
"eval_runtime": 4.2133,
"eval_samples_per_second": 25.87,
"eval_steps_per_second": 0.475,
"step": 80
},
{
"epoch": 10.97,
"eval_accuracy": 0.6055045871559633,
"eval_f1": 0.5211004609031267,
"eval_loss": 1.066982388496399,
"eval_precision": 0.7279186904119446,
"eval_recall": 0.6055045871559633,
"eval_runtime": 14.5277,
"eval_samples_per_second": 7.503,
"eval_steps_per_second": 0.138,
"step": 88
},
{
"epoch": 11.24,
"learning_rate": 0.00011458333333333334,
"loss": 1.1736,
"step": 90
},
{
"epoch": 11.97,
"eval_accuracy": 0.6605504587155964,
"eval_f1": 0.5771675777046106,
"eval_loss": 0.9855989813804626,
"eval_precision": 0.5536726213674042,
"eval_recall": 0.6605504587155964,
"eval_runtime": 4.2828,
"eval_samples_per_second": 25.451,
"eval_steps_per_second": 0.467,
"step": 96
},
{
"epoch": 12.48,
"learning_rate": 0.0001125,
"loss": 1.0457,
"step": 100
},
{
"epoch": 12.97,
"eval_accuracy": 0.6697247706422018,
"eval_f1": 0.5964926350313968,
"eval_loss": 0.896264374256134,
"eval_precision": 0.763141515721791,
"eval_recall": 0.6697247706422018,
"eval_runtime": 4.2315,
"eval_samples_per_second": 25.759,
"eval_steps_per_second": 0.473,
"step": 104
},
{
"epoch": 13.73,
"learning_rate": 0.00011041666666666666,
"loss": 0.953,
"step": 110
},
{
"epoch": 13.97,
"eval_accuracy": 0.6697247706422018,
"eval_f1": 0.6081464096911078,
"eval_loss": 0.8546512722969055,
"eval_precision": 0.6884856947005512,
"eval_recall": 0.6697247706422018,
"eval_runtime": 4.4534,
"eval_samples_per_second": 24.476,
"eval_steps_per_second": 0.449,
"step": 112
},
{
"epoch": 14.97,
"learning_rate": 0.00010833333333333334,
"loss": 0.8579,
"step": 120
},
{
"epoch": 14.97,
"eval_accuracy": 0.7155963302752294,
"eval_f1": 0.6643295304342026,
"eval_loss": 0.7848823070526123,
"eval_precision": 0.7396182317656428,
"eval_recall": 0.7155963302752294,
"eval_runtime": 4.1662,
"eval_samples_per_second": 26.163,
"eval_steps_per_second": 0.48,
"step": 120
},
{
"epoch": 15.97,
"eval_accuracy": 0.7431192660550459,
"eval_f1": 0.711852075310986,
"eval_loss": 0.7563745379447937,
"eval_precision": 0.7371817784661822,
"eval_recall": 0.7431192660550459,
"eval_runtime": 4.2674,
"eval_samples_per_second": 25.542,
"eval_steps_per_second": 0.469,
"step": 128
},
{
"epoch": 16.24,
"learning_rate": 0.00010625,
"loss": 0.8167,
"step": 130
},
{
"epoch": 16.97,
"eval_accuracy": 0.7614678899082569,
"eval_f1": 0.7210716889645992,
"eval_loss": 0.7132583260536194,
"eval_precision": 0.7506553079947577,
"eval_recall": 0.7614678899082569,
"eval_runtime": 4.1418,
"eval_samples_per_second": 26.317,
"eval_steps_per_second": 0.483,
"step": 136
},
{
"epoch": 17.48,
"learning_rate": 0.00010416666666666667,
"loss": 0.7273,
"step": 140
},
{
"epoch": 17.97,
"eval_accuracy": 0.7522935779816514,
"eval_f1": 0.7202155642522615,
"eval_loss": 0.6887747645378113,
"eval_precision": 0.7378685592291271,
"eval_recall": 0.7522935779816514,
"eval_runtime": 4.5118,
"eval_samples_per_second": 24.159,
"eval_steps_per_second": 0.443,
"step": 144
},
{
"epoch": 18.73,
"learning_rate": 0.00010208333333333334,
"loss": 0.6547,
"step": 150
},
{
"epoch": 18.97,
"eval_accuracy": 0.7798165137614679,
"eval_f1": 0.7576525411387797,
"eval_loss": 0.659186065196991,
"eval_precision": 0.7772903701802784,
"eval_recall": 0.7798165137614679,
"eval_runtime": 4.3816,
"eval_samples_per_second": 24.877,
"eval_steps_per_second": 0.456,
"step": 152
},
{
"epoch": 19.97,
"learning_rate": 0.0001,
"loss": 0.5963,
"step": 160
},
{
"epoch": 19.97,
"eval_accuracy": 0.7706422018348624,
"eval_f1": 0.7550663564666461,
"eval_loss": 0.6136144399642944,
"eval_precision": 0.764159781184113,
"eval_recall": 0.7706422018348624,
"eval_runtime": 4.2561,
"eval_samples_per_second": 25.61,
"eval_steps_per_second": 0.47,
"step": 160
},
{
"epoch": 20.97,
"eval_accuracy": 0.7889908256880734,
"eval_f1": 0.7786916064255194,
"eval_loss": 0.5723462700843811,
"eval_precision": 0.7801645588430826,
"eval_recall": 0.7889908256880734,
"eval_runtime": 5.2546,
"eval_samples_per_second": 20.744,
"eval_steps_per_second": 0.381,
"step": 168
},
{
"epoch": 21.24,
"learning_rate": 9.791666666666667e-05,
"loss": 0.551,
"step": 170
},
{
"epoch": 21.97,
"eval_accuracy": 0.7889908256880734,
"eval_f1": 0.7780894219567608,
"eval_loss": 0.5686229467391968,
"eval_precision": 0.776092121476891,
"eval_recall": 0.7889908256880734,
"eval_runtime": 4.3144,
"eval_samples_per_second": 25.264,
"eval_steps_per_second": 0.464,
"step": 176
},
{
"epoch": 22.48,
"learning_rate": 9.583333333333334e-05,
"loss": 0.4929,
"step": 180
},
{
"epoch": 22.97,
"eval_accuracy": 0.7706422018348624,
"eval_f1": 0.7651464296127533,
"eval_loss": 0.5596823692321777,
"eval_precision": 0.7649127896435436,
"eval_recall": 0.7706422018348624,
"eval_runtime": 4.4326,
"eval_samples_per_second": 24.59,
"eval_steps_per_second": 0.451,
"step": 184
},
{
"epoch": 23.73,
"learning_rate": 9.375e-05,
"loss": 0.4309,
"step": 190
},
{
"epoch": 23.97,
"eval_accuracy": 0.7889908256880734,
"eval_f1": 0.781022184850044,
"eval_loss": 0.5233965516090393,
"eval_precision": 0.7774110647118855,
"eval_recall": 0.7889908256880734,
"eval_runtime": 4.3167,
"eval_samples_per_second": 25.251,
"eval_steps_per_second": 0.463,
"step": 192
},
{
"epoch": 24.97,
"learning_rate": 9.166666666666667e-05,
"loss": 0.3945,
"step": 200
},
{
"epoch": 24.97,
"eval_accuracy": 0.7889908256880734,
"eval_f1": 0.7812909567496724,
"eval_loss": 0.5007840991020203,
"eval_precision": 0.7836723839914905,
"eval_recall": 0.7889908256880734,
"eval_runtime": 4.3513,
"eval_samples_per_second": 25.05,
"eval_steps_per_second": 0.46,
"step": 200
},
{
"epoch": 25.97,
"eval_accuracy": 0.7522935779816514,
"eval_f1": 0.7528893125223401,
"eval_loss": 0.5289302468299866,
"eval_precision": 0.7537344154316632,
"eval_recall": 0.7522935779816514,
"eval_runtime": 4.3647,
"eval_samples_per_second": 24.973,
"eval_steps_per_second": 0.458,
"step": 208
},
{
"epoch": 26.24,
"learning_rate": 8.958333333333333e-05,
"loss": 0.3704,
"step": 210
},
{
"epoch": 26.97,
"eval_accuracy": 0.7981651376146789,
"eval_f1": 0.7962706746091569,
"eval_loss": 0.4399118423461914,
"eval_precision": 0.7957732392169626,
"eval_recall": 0.7981651376146789,
"eval_runtime": 4.2147,
"eval_samples_per_second": 25.862,
"eval_steps_per_second": 0.475,
"step": 216
},
{
"epoch": 27.48,
"learning_rate": 8.75e-05,
"loss": 0.3267,
"step": 220
},
{
"epoch": 27.97,
"eval_accuracy": 0.8073394495412844,
"eval_f1": 0.8005365278178692,
"eval_loss": 0.4539415240287781,
"eval_precision": 0.7983420088683247,
"eval_recall": 0.8073394495412844,
"eval_runtime": 4.2272,
"eval_samples_per_second": 25.785,
"eval_steps_per_second": 0.473,
"step": 224
},
{
"epoch": 28.73,
"learning_rate": 8.541666666666668e-05,
"loss": 0.2966,
"step": 230
},
{
"epoch": 28.97,
"eval_accuracy": 0.7798165137614679,
"eval_f1": 0.7837137974455839,
"eval_loss": 0.4734969735145569,
"eval_precision": 0.789241175758926,
"eval_recall": 0.7798165137614679,
"eval_runtime": 4.2368,
"eval_samples_per_second": 25.727,
"eval_steps_per_second": 0.472,
"step": 232
},
{
"epoch": 29.97,
"learning_rate": 8.333333333333333e-05,
"loss": 0.2645,
"step": 240
},
{
"epoch": 29.97,
"eval_accuracy": 0.7706422018348624,
"eval_f1": 0.7706422018348624,
"eval_loss": 0.4594463109970093,
"eval_precision": 0.7706422018348624,
"eval_recall": 0.7706422018348624,
"eval_runtime": 4.3943,
"eval_samples_per_second": 24.805,
"eval_steps_per_second": 0.455,
"step": 240
},
{
"epoch": 30.97,
"eval_accuracy": 0.7522935779816514,
"eval_f1": 0.7533140030125614,
"eval_loss": 0.4698648750782013,
"eval_precision": 0.7554437319096274,
"eval_recall": 0.7522935779816514,
"eval_runtime": 4.1296,
"eval_samples_per_second": 26.394,
"eval_steps_per_second": 0.484,
"step": 248
},
{
"epoch": 31.24,
"learning_rate": 8.125000000000001e-05,
"loss": 0.2527,
"step": 250
},
{
"epoch": 31.97,
"eval_accuracy": 0.7889908256880734,
"eval_f1": 0.7856523955147808,
"eval_loss": 0.45513755083084106,
"eval_precision": 0.785609816323817,
"eval_recall": 0.7889908256880734,
"eval_runtime": 4.1348,
"eval_samples_per_second": 26.361,
"eval_steps_per_second": 0.484,
"step": 256
},
{
"epoch": 32.48,
"learning_rate": 7.916666666666666e-05,
"loss": 0.2202,
"step": 260
},
{
"epoch": 32.97,
"eval_accuracy": 0.8165137614678899,
"eval_f1": 0.8170336224601304,
"eval_loss": 0.4457748532295227,
"eval_precision": 0.8197900424266599,
"eval_recall": 0.8165137614678899,
"eval_runtime": 5.1689,
"eval_samples_per_second": 21.087,
"eval_steps_per_second": 0.387,
"step": 264
},
{
"epoch": 33.73,
"learning_rate": 7.708333333333334e-05,
"loss": 0.2006,
"step": 270
},
{
"epoch": 33.97,
"eval_accuracy": 0.7798165137614679,
"eval_f1": 0.7850412357933325,
"eval_loss": 0.46321260929107666,
"eval_precision": 0.7940749153601442,
"eval_recall": 0.7798165137614679,
"eval_runtime": 4.2326,
"eval_samples_per_second": 25.752,
"eval_steps_per_second": 0.473,
"step": 272
},
{
"epoch": 34.97,
"learning_rate": 7.500000000000001e-05,
"loss": 0.1589,
"step": 280
},
{
"epoch": 34.97,
"eval_accuracy": 0.7889908256880734,
"eval_f1": 0.7925041274199247,
"eval_loss": 0.46511203050613403,
"eval_precision": 0.7993275970140749,
"eval_recall": 0.7889908256880734,
"eval_runtime": 4.1566,
"eval_samples_per_second": 26.223,
"eval_steps_per_second": 0.481,
"step": 280
},
{
"epoch": 35.97,
"eval_accuracy": 0.7798165137614679,
"eval_f1": 0.7803733958918072,
"eval_loss": 0.45948973298072815,
"eval_precision": 0.7823930357635982,
"eval_recall": 0.7798165137614679,
"eval_runtime": 4.3202,
"eval_samples_per_second": 25.23,
"eval_steps_per_second": 0.463,
"step": 288
},
{
"epoch": 36.24,
"learning_rate": 7.291666666666666e-05,
"loss": 0.153,
"step": 290
},
{
"epoch": 36.97,
"eval_accuracy": 0.7614678899082569,
"eval_f1": 0.7632546001327497,
"eval_loss": 0.458363801240921,
"eval_precision": 0.7690950187958565,
"eval_recall": 0.7614678899082569,
"eval_runtime": 4.4275,
"eval_samples_per_second": 24.619,
"eval_steps_per_second": 0.452,
"step": 296
},
{
"epoch": 37.48,
"learning_rate": 7.083333333333334e-05,
"loss": 0.1427,
"step": 300
},
{
"epoch": 37.97,
"eval_accuracy": 0.7798165137614679,
"eval_f1": 0.7796360891921739,
"eval_loss": 0.46078726649284363,
"eval_precision": 0.782995656118911,
"eval_recall": 0.7798165137614679,
"eval_runtime": 4.4461,
"eval_samples_per_second": 24.516,
"eval_steps_per_second": 0.45,
"step": 304
},
{
"epoch": 38.73,
"learning_rate": 6.874999999999999e-05,
"loss": 0.113,
"step": 310
},
{
"epoch": 38.97,
"eval_accuracy": 0.7889908256880734,
"eval_f1": 0.7898954921921011,
"eval_loss": 0.45713570713996887,
"eval_precision": 0.7922270390160299,
"eval_recall": 0.7889908256880734,
"eval_runtime": 4.3087,
"eval_samples_per_second": 25.297,
"eval_steps_per_second": 0.464,
"step": 312
},
{
"epoch": 39.97,
"learning_rate": 6.666666666666667e-05,
"loss": 0.1146,
"step": 320
},
{
"epoch": 39.97,
"eval_accuracy": 0.7614678899082569,
"eval_f1": 0.7612891030218949,
"eval_loss": 0.5269873142242432,
"eval_precision": 0.765128347697155,
"eval_recall": 0.7614678899082569,
"eval_runtime": 4.2908,
"eval_samples_per_second": 25.403,
"eval_steps_per_second": 0.466,
"step": 320
},
{
"epoch": 40.97,
"eval_accuracy": 0.7706422018348624,
"eval_f1": 0.7709516996486127,
"eval_loss": 0.48878130316734314,
"eval_precision": 0.7781771515945828,
"eval_recall": 0.7706422018348624,
"eval_runtime": 4.3303,
"eval_samples_per_second": 25.171,
"eval_steps_per_second": 0.462,
"step": 328
},
{
"epoch": 41.24,
"learning_rate": 6.458333333333334e-05,
"loss": 0.1275,
"step": 330
},
{
"epoch": 41.97,
"eval_accuracy": 0.7889908256880734,
"eval_f1": 0.7836706749228535,
"eval_loss": 0.4523099958896637,
"eval_precision": 0.780905883107718,
"eval_recall": 0.7889908256880734,
"eval_runtime": 4.2033,
"eval_samples_per_second": 25.932,
"eval_steps_per_second": 0.476,
"step": 336
},
{
"epoch": 42.48,
"learning_rate": 6.25e-05,
"loss": 0.0959,
"step": 340
},
{
"epoch": 42.97,
"eval_accuracy": 0.7798165137614679,
"eval_f1": 0.7767063396275014,
"eval_loss": 0.46965503692626953,
"eval_precision": 0.7753268138589239,
"eval_recall": 0.7798165137614679,
"eval_runtime": 4.3242,
"eval_samples_per_second": 25.207,
"eval_steps_per_second": 0.463,
"step": 344
},
{
"epoch": 43.73,
"learning_rate": 6.041666666666667e-05,
"loss": 0.0882,
"step": 350
},
{
"epoch": 43.97,
"eval_accuracy": 0.7706422018348624,
"eval_f1": 0.7685729724992435,
"eval_loss": 0.4286104738712311,
"eval_precision": 0.7685932721712537,
"eval_recall": 0.7706422018348624,
"eval_runtime": 4.4175,
"eval_samples_per_second": 24.675,
"eval_steps_per_second": 0.453,
"step": 352
},
{
"epoch": 44.97,
"learning_rate": 5.833333333333333e-05,
"loss": 0.0847,
"step": 360
},
{
"epoch": 44.97,
"eval_accuracy": 0.7889908256880734,
"eval_f1": 0.7925041274199247,
"eval_loss": 0.5317460298538208,
"eval_precision": 0.7993275970140749,
"eval_recall": 0.7889908256880734,
"eval_runtime": 6.0042,
"eval_samples_per_second": 18.154,
"eval_steps_per_second": 0.333,
"step": 360
},
{
"epoch": 45.97,
"eval_accuracy": 0.7614678899082569,
"eval_f1": 0.7646893115457605,
"eval_loss": 0.5431071519851685,
"eval_precision": 0.7699552364490537,
"eval_recall": 0.7614678899082569,
"eval_runtime": 4.3547,
"eval_samples_per_second": 25.03,
"eval_steps_per_second": 0.459,
"step": 368
},
{
"epoch": 46.24,
"learning_rate": 5.625e-05,
"loss": 0.0813,
"step": 370
},
{
"epoch": 46.97,
"eval_accuracy": 0.8256880733944955,
"eval_f1": 0.8284158367266842,
"eval_loss": 0.44316479563713074,
"eval_precision": 0.843538901662607,
"eval_recall": 0.8256880733944955,
"eval_runtime": 4.2714,
"eval_samples_per_second": 25.519,
"eval_steps_per_second": 0.468,
"step": 376
},
{
"epoch": 47.48,
"learning_rate": 5.416666666666667e-05,
"loss": 0.0768,
"step": 380
},
{
"epoch": 47.97,
"eval_accuracy": 0.7981651376146789,
"eval_f1": 0.7955546490941502,
"eval_loss": 0.4885597229003906,
"eval_precision": 0.8005162605636117,
"eval_recall": 0.7981651376146789,
"eval_runtime": 4.2576,
"eval_samples_per_second": 25.602,
"eval_steps_per_second": 0.47,
"step": 384
},
{
"epoch": 48.73,
"learning_rate": 5.208333333333334e-05,
"loss": 0.0627,
"step": 390
},
{
"epoch": 48.97,
"eval_accuracy": 0.7981651376146789,
"eval_f1": 0.8009727230444837,
"eval_loss": 0.5372528433799744,
"eval_precision": 0.8071912929511652,
"eval_recall": 0.7981651376146789,
"eval_runtime": 4.3763,
"eval_samples_per_second": 24.907,
"eval_steps_per_second": 0.457,
"step": 392
},
{
"epoch": 49.97,
"learning_rate": 5e-05,
"loss": 0.0688,
"step": 400
},
{
"epoch": 49.97,
"eval_accuracy": 0.7798165137614679,
"eval_f1": 0.7822443312570955,
"eval_loss": 0.5896694660186768,
"eval_precision": 0.789232725399693,
"eval_recall": 0.7798165137614679,
"eval_runtime": 4.3692,
"eval_samples_per_second": 24.947,
"eval_steps_per_second": 0.458,
"step": 400
},
{
"epoch": 50.97,
"eval_accuracy": 0.7981651376146789,
"eval_f1": 0.7992371326578404,
"eval_loss": 0.5114642977714539,
"eval_precision": 0.8014849021031709,
"eval_recall": 0.7981651376146789,
"eval_runtime": 4.3028,
"eval_samples_per_second": 25.332,
"eval_steps_per_second": 0.465,
"step": 408
},
{
"epoch": 51.24,
"learning_rate": 4.791666666666667e-05,
"loss": 0.0676,
"step": 410
},
{
"epoch": 51.97,
"eval_accuracy": 0.7981651376146789,
"eval_f1": 0.7977993643940755,
"eval_loss": 0.4881470799446106,
"eval_precision": 0.7998301588132414,
"eval_recall": 0.7981651376146789,
"eval_runtime": 4.3212,
"eval_samples_per_second": 25.224,
"eval_steps_per_second": 0.463,
"step": 416
},
{
"epoch": 52.48,
"learning_rate": 4.5833333333333334e-05,
"loss": 0.0539,
"step": 420
},
{
"epoch": 52.97,
"eval_accuracy": 0.8073394495412844,
"eval_f1": 0.807691055721277,
"eval_loss": 0.4819609224796295,
"eval_precision": 0.8138503399273244,
"eval_recall": 0.8073394495412844,
"eval_runtime": 4.3125,
"eval_samples_per_second": 25.276,
"eval_steps_per_second": 0.464,
"step": 424
},
{
"epoch": 53.73,
"learning_rate": 4.375e-05,
"loss": 0.0596,
"step": 430
},
{
"epoch": 53.97,
"eval_accuracy": 0.8256880733944955,
"eval_f1": 0.8244465797713664,
"eval_loss": 0.4449571669101715,
"eval_precision": 0.8245908379614004,
"eval_recall": 0.8256880733944955,
"eval_runtime": 5.8195,
"eval_samples_per_second": 18.73,
"eval_steps_per_second": 0.344,
"step": 432
},
{
"epoch": 54.97,
"learning_rate": 4.1666666666666665e-05,
"loss": 0.0611,
"step": 440
},
{
"epoch": 54.97,
"eval_accuracy": 0.7889908256880734,
"eval_f1": 0.7924465793472197,
"eval_loss": 0.5057494044303894,
"eval_precision": 0.8008019735410222,
"eval_recall": 0.7889908256880734,
"eval_runtime": 4.6616,
"eval_samples_per_second": 23.383,
"eval_steps_per_second": 0.429,
"step": 440
},
{
"epoch": 55.97,
"eval_accuracy": 0.7981651376146789,
"eval_f1": 0.8008031371900772,
"eval_loss": 0.4918478727340698,
"eval_precision": 0.8056331161636306,
"eval_recall": 0.7981651376146789,
"eval_runtime": 4.8639,
"eval_samples_per_second": 22.41,
"eval_steps_per_second": 0.411,
"step": 448
},
{
"epoch": 56.24,
"learning_rate": 3.958333333333333e-05,
"loss": 0.0643,
"step": 450
},
{
"epoch": 56.97,
"eval_accuracy": 0.7522935779816514,
"eval_f1": 0.7545272459450874,
"eval_loss": 0.5946044325828552,
"eval_precision": 0.7587394976605187,
"eval_recall": 0.7522935779816514,
"eval_runtime": 4.4153,
"eval_samples_per_second": 24.687,
"eval_steps_per_second": 0.453,
"step": 456
},
{
"epoch": 57.48,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.0605,
"step": 460
},
{
"epoch": 57.97,
"eval_accuracy": 0.8073394495412844,
"eval_f1": 0.8120936083458042,
"eval_loss": 0.4887966513633728,
"eval_precision": 0.8238645162528876,
"eval_recall": 0.8073394495412844,
"eval_runtime": 6.6734,
"eval_samples_per_second": 16.334,
"eval_steps_per_second": 0.3,
"step": 464
},
{
"epoch": 58.73,
"learning_rate": 3.541666666666667e-05,
"loss": 0.063,
"step": 470
},
{
"epoch": 58.97,
"eval_accuracy": 0.7889908256880734,
"eval_f1": 0.7936673558168583,
"eval_loss": 0.5916518568992615,
"eval_precision": 0.8051419661311963,
"eval_recall": 0.7889908256880734,
"eval_runtime": 4.2726,
"eval_samples_per_second": 25.511,
"eval_steps_per_second": 0.468,
"step": 472
},
{
"epoch": 59.97,
"learning_rate": 3.3333333333333335e-05,
"loss": 0.0595,
"step": 480
},
{
"epoch": 59.97,
"eval_accuracy": 0.7889908256880734,
"eval_f1": 0.7894285298217145,
"eval_loss": 0.5117025375366211,
"eval_precision": 0.7904302906815871,
"eval_recall": 0.7889908256880734,
"eval_runtime": 4.4288,
"eval_samples_per_second": 24.612,
"eval_steps_per_second": 0.452,
"step": 480
},
{
"epoch": 60.97,
"eval_accuracy": 0.7614678899082569,
"eval_f1": 0.7635438011331693,
"eval_loss": 0.549720048904419,
"eval_precision": 0.769159484755815,
"eval_recall": 0.7614678899082569,
"eval_runtime": 4.2635,
"eval_samples_per_second": 25.566,
"eval_steps_per_second": 0.469,
"step": 488
},
{
"epoch": 61.24,
"learning_rate": 3.125e-05,
"loss": 0.0554,
"step": 490
},
{
"epoch": 61.97,
"eval_accuracy": 0.8165137614678899,
"eval_f1": 0.812552773801982,
"eval_loss": 0.4742366075515747,
"eval_precision": 0.8100926678908328,
"eval_recall": 0.8165137614678899,
"eval_runtime": 4.3801,
"eval_samples_per_second": 24.885,
"eval_steps_per_second": 0.457,
"step": 496
},
{
"epoch": 62.48,
"learning_rate": 2.9166666666666666e-05,
"loss": 0.0557,
"step": 500
},
{
"epoch": 62.97,
"eval_accuracy": 0.7889908256880734,
"eval_f1": 0.7886246853481453,
"eval_loss": 0.5369319915771484,
"eval_precision": 0.7886251828214332,
"eval_recall": 0.7889908256880734,
"eval_runtime": 4.4776,
"eval_samples_per_second": 24.343,
"eval_steps_per_second": 0.447,
"step": 504
},
{
"epoch": 63.73,
"learning_rate": 2.7083333333333335e-05,
"loss": 0.0539,
"step": 510
},
{
"epoch": 63.97,
"eval_accuracy": 0.7889908256880734,
"eval_f1": 0.7898954921921011,
"eval_loss": 0.5439756512641907,
"eval_precision": 0.7922270390160299,
"eval_recall": 0.7889908256880734,
"eval_runtime": 4.4228,
"eval_samples_per_second": 24.645,
"eval_steps_per_second": 0.452,
"step": 512
},
{
"epoch": 64.97,
"learning_rate": 2.5e-05,
"loss": 0.048,
"step": 520
},
{
"epoch": 64.97,
"eval_accuracy": 0.7889908256880734,
"eval_f1": 0.7882784673502429,
"eval_loss": 0.5923751592636108,
"eval_precision": 0.7878178107535906,
"eval_recall": 0.7889908256880734,
"eval_runtime": 5.5392,
"eval_samples_per_second": 19.678,
"eval_steps_per_second": 0.361,
"step": 520
},
{
"epoch": 65.97,
"eval_accuracy": 0.8440366972477065,
"eval_f1": 0.8440366972477065,
"eval_loss": 0.486260324716568,
"eval_precision": 0.8440366972477065,
"eval_recall": 0.8440366972477065,
"eval_runtime": 4.2084,
"eval_samples_per_second": 25.9,
"eval_steps_per_second": 0.475,
"step": 528
},
{
"epoch": 66.24,
"learning_rate": 2.2916666666666667e-05,
"loss": 0.045,
"step": 530
},
{
"epoch": 66.97,
"eval_accuracy": 0.8073394495412844,
"eval_f1": 0.8046694749207712,
"eval_loss": 0.5849686861038208,
"eval_precision": 0.8076432996157767,
"eval_recall": 0.8073394495412844,
"eval_runtime": 4.3405,
"eval_samples_per_second": 25.112,
"eval_steps_per_second": 0.461,
"step": 536
},
{
"epoch": 67.48,
"learning_rate": 2.0833333333333333e-05,
"loss": 0.047,
"step": 540
},
{
"epoch": 67.97,
"eval_accuracy": 0.8256880733944955,
"eval_f1": 0.8227139701424718,
"eval_loss": 0.4938836991786957,
"eval_precision": 0.8211639886949021,
"eval_recall": 0.8256880733944955,
"eval_runtime": 4.2943,
"eval_samples_per_second": 25.382,
"eval_steps_per_second": 0.466,
"step": 544
},
{
"epoch": 68.73,
"learning_rate": 1.8750000000000002e-05,
"loss": 0.0412,
"step": 550
},
{
"epoch": 68.97,
"eval_accuracy": 0.7889908256880734,
"eval_f1": 0.7899819010172877,
"eval_loss": 0.4850451946258545,
"eval_precision": 0.7911629060252914,
"eval_recall": 0.7889908256880734,
"eval_runtime": 4.3733,
"eval_samples_per_second": 24.924,
"eval_steps_per_second": 0.457,
"step": 552
},
{
"epoch": 69.97,
"learning_rate": 1.6666666666666667e-05,
"loss": 0.0392,
"step": 560
},
{
"epoch": 69.97,
"eval_accuracy": 0.8256880733944955,
"eval_f1": 0.8257529642156887,
"eval_loss": 0.5065794587135315,
"eval_precision": 0.8264957264957264,
"eval_recall": 0.8256880733944955,
"eval_runtime": 4.2901,
"eval_samples_per_second": 25.407,
"eval_steps_per_second": 0.466,
"step": 560
},
{
"epoch": 70.97,
"eval_accuracy": 0.8073394495412844,
"eval_f1": 0.8058135764557783,
"eval_loss": 0.49649733304977417,
"eval_precision": 0.8053007135575942,
"eval_recall": 0.8073394495412844,
"eval_runtime": 4.1424,
"eval_samples_per_second": 26.313,
"eval_steps_per_second": 0.483,
"step": 568
},
{
"epoch": 71.24,
"learning_rate": 1.4583333333333333e-05,
"loss": 0.0423,
"step": 570
},
{
"epoch": 71.97,
"eval_accuracy": 0.8348623853211009,
"eval_f1": 0.8350885030999028,
"eval_loss": 0.47168704867362976,
"eval_precision": 0.8376424034680915,
"eval_recall": 0.8348623853211009,
"eval_runtime": 4.1897,
"eval_samples_per_second": 26.016,
"eval_steps_per_second": 0.477,
"step": 576
},
{
"epoch": 72.48,
"learning_rate": 1.25e-05,
"loss": 0.0471,
"step": 580
},
{
"epoch": 72.97,
"eval_accuracy": 0.8256880733944955,
"eval_f1": 0.8295520158325865,
"eval_loss": 0.48450949788093567,
"eval_precision": 0.837811160528748,
"eval_recall": 0.8256880733944955,
"eval_runtime": 4.2446,
"eval_samples_per_second": 25.68,
"eval_steps_per_second": 0.471,
"step": 584
},
{
"epoch": 73.73,
"learning_rate": 1.0416666666666666e-05,
"loss": 0.0322,
"step": 590
},
{
"epoch": 73.97,
"eval_accuracy": 0.7706422018348624,
"eval_f1": 0.7692886041532689,
"eval_loss": 0.5188109278678894,
"eval_precision": 0.7689271840647987,
"eval_recall": 0.7706422018348624,
"eval_runtime": 4.4833,
"eval_samples_per_second": 24.313,
"eval_steps_per_second": 0.446,
"step": 592
},
{
"epoch": 74.97,
"learning_rate": 8.333333333333334e-06,
"loss": 0.042,
"step": 600
},
{
"epoch": 74.97,
"eval_accuracy": 0.7706422018348624,
"eval_f1": 0.7700888306392893,
"eval_loss": 0.5242283940315247,
"eval_precision": 0.7698942959712803,
"eval_recall": 0.7706422018348624,
"eval_runtime": 4.4923,
"eval_samples_per_second": 24.264,
"eval_steps_per_second": 0.445,
"step": 600
},
{
"epoch": 75.97,
"eval_accuracy": 0.7798165137614679,
"eval_f1": 0.7803733958918072,
"eval_loss": 0.5945499539375305,
"eval_precision": 0.7823930357635982,
"eval_recall": 0.7798165137614679,
"eval_runtime": 5.1633,
"eval_samples_per_second": 21.111,
"eval_steps_per_second": 0.387,
"step": 608
},
{
"epoch": 76.24,
"learning_rate": 6.25e-06,
"loss": 0.0416,
"step": 610
},
{
"epoch": 76.97,
"eval_accuracy": 0.7981651376146789,
"eval_f1": 0.7993445642022374,
"eval_loss": 0.5432426929473877,
"eval_precision": 0.8038185145085823,
"eval_recall": 0.7981651376146789,
"eval_runtime": 4.2234,
"eval_samples_per_second": 25.809,
"eval_steps_per_second": 0.474,
"step": 616
},
{
"epoch": 77.48,
"learning_rate": 4.166666666666667e-06,
"loss": 0.0399,
"step": 620
},
{
"epoch": 77.97,
"eval_accuracy": 0.7981651376146789,
"eval_f1": 0.7994120087594209,
"eval_loss": 0.5381362438201904,
"eval_precision": 0.8072242548450546,
"eval_recall": 0.7981651376146789,
"eval_runtime": 4.2152,
"eval_samples_per_second": 25.859,
"eval_steps_per_second": 0.474,
"step": 624
},
{
"epoch": 78.73,
"learning_rate": 2.0833333333333334e-06,
"loss": 0.0439,
"step": 630
},
{
"epoch": 78.97,
"eval_accuracy": 0.7798165137614679,
"eval_f1": 0.7827462243679189,
"eval_loss": 0.6181262135505676,
"eval_precision": 0.7877941763063422,
"eval_recall": 0.7798165137614679,
"eval_runtime": 4.2424,
"eval_samples_per_second": 25.693,
"eval_steps_per_second": 0.471,
"step": 632
},
{
"epoch": 79.97,
"learning_rate": 0.0,
"loss": 0.0462,
"step": 640
},
{
"epoch": 79.97,
"eval_accuracy": 0.8165137614678899,
"eval_f1": 0.8172526992448356,
"eval_loss": 0.48008766770362854,
"eval_precision": 0.8181998512273742,
"eval_recall": 0.8165137614678899,
"eval_runtime": 4.18,
"eval_samples_per_second": 26.076,
"eval_steps_per_second": 0.478,
"step": 640
},
{
"epoch": 79.97,
"step": 640,
"total_flos": 3.5167284631649157e+18,
"train_loss": 0.37728101573884487,
"train_runtime": 2345.4183,
"train_samples_per_second": 70.606,
"train_steps_per_second": 0.273
}
],
"max_steps": 640,
"num_train_epochs": 80,
"total_flos": 3.5167284631649157e+18,
"trial_name": null,
"trial_params": null
}