llama_8b_lima_40 / trainer_log.jsonl
OpenLeecher's picture
Model save
1e78fdd verified
{"current_steps": 5, "total_steps": 1040, "loss": 1.275, "lr": 7.142857142857143e-07, "epoch": 0.004807692307692308, "percentage": 0.48, "elapsed_time": "0:00:58", "remaining_time": "3:22:01"}
{"current_steps": 10, "total_steps": 1040, "loss": 1.0842, "lr": 1.4285714285714286e-06, "epoch": 0.009615384615384616, "percentage": 0.96, "elapsed_time": "0:01:38", "remaining_time": "2:48:39"}
{"current_steps": 15, "total_steps": 1040, "loss": 1.0731, "lr": 2.142857142857143e-06, "epoch": 0.014423076923076924, "percentage": 1.44, "elapsed_time": "0:02:16", "remaining_time": "2:35:48"}
{"current_steps": 20, "total_steps": 1040, "loss": 0.9966, "lr": 2.8571428571428573e-06, "epoch": 0.019230769230769232, "percentage": 1.92, "elapsed_time": "0:02:53", "remaining_time": "2:27:53"}
{"current_steps": 25, "total_steps": 1040, "loss": 0.9506, "lr": 3.5714285714285714e-06, "epoch": 0.02403846153846154, "percentage": 2.4, "elapsed_time": "0:03:32", "remaining_time": "2:23:27"}
{"current_steps": 30, "total_steps": 1040, "loss": 0.9081, "lr": 4.285714285714286e-06, "epoch": 0.028846153846153848, "percentage": 2.88, "elapsed_time": "0:04:10", "remaining_time": "2:20:47"}
{"current_steps": 35, "total_steps": 1040, "loss": 0.9839, "lr": 5e-06, "epoch": 0.03365384615384615, "percentage": 3.37, "elapsed_time": "0:04:50", "remaining_time": "2:19:03"}
{"current_steps": 40, "total_steps": 1040, "loss": 0.9143, "lr": 5.7142857142857145e-06, "epoch": 0.038461538461538464, "percentage": 3.85, "elapsed_time": "0:05:31", "remaining_time": "2:18:00"}
{"current_steps": 45, "total_steps": 1040, "loss": 1.0449, "lr": 5.958760472832704e-06, "epoch": 0.04326923076923077, "percentage": 4.33, "elapsed_time": "0:06:09", "remaining_time": "2:16:13"}
{"current_steps": 50, "total_steps": 1040, "loss": 1.1233, "lr": 5.890441320869003e-06, "epoch": 0.04807692307692308, "percentage": 4.81, "elapsed_time": "0:06:55", "remaining_time": "2:17:07"}
{"current_steps": 55, "total_steps": 1040, "loss": 0.7838, "lr": 5.822637783235761e-06, "epoch": 0.052884615384615384, "percentage": 5.29, "elapsed_time": "0:07:25", "remaining_time": "2:13:06"}
{"current_steps": 60, "total_steps": 1040, "loss": 0.937, "lr": 5.755348556225628e-06, "epoch": 0.057692307692307696, "percentage": 5.77, "elapsed_time": "0:08:00", "remaining_time": "2:10:51"}
{"current_steps": 65, "total_steps": 1040, "loss": 0.9261, "lr": 5.688572332818116e-06, "epoch": 0.0625, "percentage": 6.25, "elapsed_time": "0:08:44", "remaining_time": "2:11:08"}
{"current_steps": 70, "total_steps": 1040, "loss": 0.929, "lr": 5.622307802654199e-06, "epoch": 0.0673076923076923, "percentage": 6.73, "elapsed_time": "0:09:19", "remaining_time": "2:09:13"}
{"current_steps": 75, "total_steps": 1040, "loss": 1.0281, "lr": 5.556553652010609e-06, "epoch": 0.07211538461538461, "percentage": 7.21, "elapsed_time": "0:10:10", "remaining_time": "2:10:56"}
{"current_steps": 80, "total_steps": 1040, "loss": 1.0252, "lr": 5.4913085637737825e-06, "epoch": 0.07692307692307693, "percentage": 7.69, "elapsed_time": "0:10:55", "remaining_time": "2:11:05"}
{"current_steps": 80, "total_steps": 1040, "eval_loss": 1.0117295980453491, "epoch": 0.07692307692307693, "percentage": 7.69, "elapsed_time": "0:11:17", "remaining_time": "2:15:31"}
{"current_steps": 85, "total_steps": 1040, "loss": 0.9798, "lr": 5.42657121741348e-06, "epoch": 0.08173076923076923, "percentage": 8.17, "elapsed_time": "0:11:54", "remaining_time": "2:13:50"}
{"current_steps": 90, "total_steps": 1040, "loss": 0.9422, "lr": 5.362340288956054e-06, "epoch": 0.08653846153846154, "percentage": 8.65, "elapsed_time": "0:12:30", "remaining_time": "2:12:06"}
{"current_steps": 95, "total_steps": 1040, "loss": 0.7751, "lr": 5.298614450957377e-06, "epoch": 0.09134615384615384, "percentage": 9.13, "elapsed_time": "0:13:05", "remaining_time": "2:10:16"}
{"current_steps": 100, "total_steps": 1040, "loss": 1.0559, "lr": 5.235392372475402e-06, "epoch": 0.09615384615384616, "percentage": 9.62, "elapsed_time": "0:13:47", "remaining_time": "2:09:34"}
{"current_steps": 105, "total_steps": 1040, "loss": 0.8535, "lr": 5.1726727190423596e-06, "epoch": 0.10096153846153846, "percentage": 10.1, "elapsed_time": "0:14:19", "remaining_time": "2:07:31"}
{"current_steps": 110, "total_steps": 1040, "loss": 1.0847, "lr": 5.110454152636601e-06, "epoch": 0.10576923076923077, "percentage": 10.58, "elapsed_time": "0:15:02", "remaining_time": "2:07:13"}
{"current_steps": 115, "total_steps": 1040, "loss": 0.989, "lr": 5.04873533165404e-06, "epoch": 0.11057692307692307, "percentage": 11.06, "elapsed_time": "0:15:43", "remaining_time": "2:06:29"}
{"current_steps": 120, "total_steps": 1040, "loss": 0.7562, "lr": 4.987514910879233e-06, "epoch": 0.11538461538461539, "percentage": 11.54, "elapsed_time": "0:16:17", "remaining_time": "2:04:51"}
{"current_steps": 125, "total_steps": 1040, "loss": 0.882, "lr": 4.9267915414560465e-06, "epoch": 0.1201923076923077, "percentage": 12.02, "elapsed_time": "0:16:50", "remaining_time": "2:03:18"}
{"current_steps": 130, "total_steps": 1040, "loss": 0.8461, "lr": 4.866563870857949e-06, "epoch": 0.125, "percentage": 12.5, "elapsed_time": "0:17:23", "remaining_time": "2:01:44"}
{"current_steps": 135, "total_steps": 1040, "loss": 1.0949, "lr": 4.806830542857871e-06, "epoch": 0.12980769230769232, "percentage": 12.98, "elapsed_time": "0:18:07", "remaining_time": "2:01:29"}
{"current_steps": 140, "total_steps": 1040, "loss": 0.9741, "lr": 4.7475901974976784e-06, "epoch": 0.1346153846153846, "percentage": 13.46, "elapsed_time": "0:18:47", "remaining_time": "2:00:48"}
{"current_steps": 145, "total_steps": 1040, "loss": 0.8267, "lr": 4.688841471057191e-06, "epoch": 0.13942307692307693, "percentage": 13.94, "elapsed_time": "0:19:21", "remaining_time": "1:59:30"}
{"current_steps": 150, "total_steps": 1040, "loss": 0.9237, "lr": 4.630582996022805e-06, "epoch": 0.14423076923076922, "percentage": 14.42, "elapsed_time": "0:20:00", "remaining_time": "1:58:41"}
{"current_steps": 155, "total_steps": 1040, "loss": 0.9735, "lr": 4.572813401055646e-06, "epoch": 0.14903846153846154, "percentage": 14.9, "elapsed_time": "0:20:38", "remaining_time": "1:57:49"}
{"current_steps": 160, "total_steps": 1040, "loss": 0.8185, "lr": 4.515531310959294e-06, "epoch": 0.15384615384615385, "percentage": 15.38, "elapsed_time": "0:21:18", "remaining_time": "1:57:11"}
{"current_steps": 160, "total_steps": 1040, "eval_loss": 0.9820164442062378, "epoch": 0.15384615384615385, "percentage": 15.38, "elapsed_time": "0:21:39", "remaining_time": "1:59:05"}
{"current_steps": 165, "total_steps": 1040, "loss": 0.9701, "lr": 4.458735346647049e-06, "epoch": 0.15865384615384615, "percentage": 15.87, "elapsed_time": "0:22:15", "remaining_time": "1:57:59"}
{"current_steps": 170, "total_steps": 1040, "loss": 0.7428, "lr": 4.402424125108714e-06, "epoch": 0.16346153846153846, "percentage": 16.35, "elapsed_time": "0:22:48", "remaining_time": "1:56:43"}
{"current_steps": 175, "total_steps": 1040, "loss": 1.0573, "lr": 4.346596259376934e-06, "epoch": 0.16826923076923078, "percentage": 16.83, "elapsed_time": "0:23:32", "remaining_time": "1:56:19"}
{"current_steps": 180, "total_steps": 1040, "loss": 0.99, "lr": 4.291250358493015e-06, "epoch": 0.17307692307692307, "percentage": 17.31, "elapsed_time": "0:24:13", "remaining_time": "1:55:43"}
{"current_steps": 185, "total_steps": 1040, "loss": 0.9208, "lr": 4.236385027472282e-06, "epoch": 0.1778846153846154, "percentage": 17.79, "elapsed_time": "0:24:48", "remaining_time": "1:54:41"}
{"current_steps": 190, "total_steps": 1040, "loss": 0.9552, "lr": 4.181998867268901e-06, "epoch": 0.18269230769230768, "percentage": 18.27, "elapsed_time": "0:25:26", "remaining_time": "1:53:50"}
{"current_steps": 195, "total_steps": 1040, "loss": 0.9004, "lr": 4.1280904747402165e-06, "epoch": 0.1875, "percentage": 18.75, "elapsed_time": "0:26:01", "remaining_time": "1:52:48"}
{"current_steps": 200, "total_steps": 1040, "loss": 1.0189, "lr": 4.07465844261054e-06, "epoch": 0.19230769230769232, "percentage": 19.23, "elapsed_time": "0:26:47", "remaining_time": "1:52:32"}
{"current_steps": 205, "total_steps": 1040, "loss": 0.8663, "lr": 4.021701359434411e-06, "epoch": 0.1971153846153846, "percentage": 19.71, "elapsed_time": "0:27:24", "remaining_time": "1:51:36"}
{"current_steps": 210, "total_steps": 1040, "loss": 0.9191, "lr": 3.9692178095593185e-06, "epoch": 0.20192307692307693, "percentage": 20.19, "elapsed_time": "0:28:11", "remaining_time": "1:51:26"}
{"current_steps": 215, "total_steps": 1040, "loss": 0.8463, "lr": 3.917206373087843e-06, "epoch": 0.20673076923076922, "percentage": 20.67, "elapsed_time": "0:28:47", "remaining_time": "1:50:29"}
{"current_steps": 220, "total_steps": 1040, "loss": 0.9113, "lr": 3.86566562583925e-06, "epoch": 0.21153846153846154, "percentage": 21.15, "elapsed_time": "0:29:31", "remaining_time": "1:50:03"}
{"current_steps": 225, "total_steps": 1040, "loss": 0.8026, "lr": 3.814594139310489e-06, "epoch": 0.21634615384615385, "percentage": 21.63, "elapsed_time": "0:30:09", "remaining_time": "1:49:14"}
{"current_steps": 230, "total_steps": 1040, "loss": 1.0014, "lr": 3.7639904806365957e-06, "epoch": 0.22115384615384615, "percentage": 22.12, "elapsed_time": "0:30:50", "remaining_time": "1:48:37"}
{"current_steps": 235, "total_steps": 1040, "loss": 0.8704, "lr": 3.7138532125504874e-06, "epoch": 0.22596153846153846, "percentage": 22.6, "elapsed_time": "0:31:33", "remaining_time": "1:48:07"}
{"current_steps": 240, "total_steps": 1040, "loss": 0.9686, "lr": 3.664180893342146e-06, "epoch": 0.23076923076923078, "percentage": 23.08, "elapsed_time": "0:32:20", "remaining_time": "1:47:49"}
{"current_steps": 240, "total_steps": 1040, "eval_loss": 0.9701676964759827, "epoch": 0.23076923076923078, "percentage": 23.08, "elapsed_time": "0:32:41", "remaining_time": "1:48:59"}
{"current_steps": 245, "total_steps": 1040, "loss": 0.9927, "lr": 3.6149720768171497e-06, "epoch": 0.23557692307692307, "percentage": 23.56, "elapsed_time": "0:33:20", "remaining_time": "1:48:12"}
{"current_steps": 250, "total_steps": 1040, "loss": 0.8335, "lr": 3.5662253122545742e-06, "epoch": 0.2403846153846154, "percentage": 24.04, "elapsed_time": "0:33:57", "remaining_time": "1:47:18"}
{"current_steps": 255, "total_steps": 1040, "loss": 0.9225, "lr": 3.517939144364211e-06, "epoch": 0.24519230769230768, "percentage": 24.52, "elapsed_time": "0:34:35", "remaining_time": "1:46:28"}
{"current_steps": 260, "total_steps": 1040, "loss": 0.9645, "lr": 3.4701121132431283e-06, "epoch": 0.25, "percentage": 25.0, "elapsed_time": "0:35:19", "remaining_time": "1:45:57"}
{"current_steps": 265, "total_steps": 1040, "loss": 1.0596, "lr": 3.422742754331519e-06, "epoch": 0.2548076923076923, "percentage": 25.48, "elapsed_time": "0:36:03", "remaining_time": "1:45:27"}
{"current_steps": 270, "total_steps": 1040, "loss": 0.8279, "lr": 3.3758295983678575e-06, "epoch": 0.25961538461538464, "percentage": 25.96, "elapsed_time": "0:36:38", "remaining_time": "1:44:29"}
{"current_steps": 275, "total_steps": 1040, "loss": 0.7653, "lr": 3.329371171343321e-06, "epoch": 0.2644230769230769, "percentage": 26.44, "elapsed_time": "0:37:14", "remaining_time": "1:43:35"}
{"current_steps": 280, "total_steps": 1040, "loss": 0.8703, "lr": 3.2833659944554757e-06, "epoch": 0.2692307692307692, "percentage": 26.92, "elapsed_time": "0:37:56", "remaining_time": "1:42:58"}
{"current_steps": 285, "total_steps": 1040, "loss": 0.826, "lr": 3.2378125840611978e-06, "epoch": 0.27403846153846156, "percentage": 27.4, "elapsed_time": "0:38:29", "remaining_time": "1:41:57"}
{"current_steps": 290, "total_steps": 1040, "loss": 0.8617, "lr": 3.192709451628821e-06, "epoch": 0.27884615384615385, "percentage": 27.88, "elapsed_time": "0:39:08", "remaining_time": "1:41:13"}
{"current_steps": 295, "total_steps": 1040, "loss": 0.9925, "lr": 3.1480551036895063e-06, "epoch": 0.28365384615384615, "percentage": 28.37, "elapsed_time": "0:39:48", "remaining_time": "1:40:31"}
{"current_steps": 300, "total_steps": 1040, "loss": 0.8276, "lr": 3.1038480417877728e-06, "epoch": 0.28846153846153844, "percentage": 28.85, "elapsed_time": "0:40:25", "remaining_time": "1:39:43"}
{"current_steps": 305, "total_steps": 1040, "loss": 0.93, "lr": 3.0600867624312124e-06, "epoch": 0.2932692307692308, "percentage": 29.33, "elapsed_time": "0:41:02", "remaining_time": "1:38:53"}
{"current_steps": 310, "total_steps": 1040, "loss": 0.9093, "lr": 3.0167697570393586e-06, "epoch": 0.2980769230769231, "percentage": 29.81, "elapsed_time": "0:41:40", "remaining_time": "1:38:08"}
{"current_steps": 315, "total_steps": 1040, "loss": 0.8436, "lr": 2.973895511891673e-06, "epoch": 0.30288461538461536, "percentage": 30.29, "elapsed_time": "0:42:19", "remaining_time": "1:37:24"}
{"current_steps": 320, "total_steps": 1040, "loss": 0.7962, "lr": 2.9314625080746407e-06, "epoch": 0.3076923076923077, "percentage": 30.77, "elapsed_time": "0:42:53", "remaining_time": "1:36:30"}
{"current_steps": 320, "total_steps": 1040, "eval_loss": 0.9604336619377136, "epoch": 0.3076923076923077, "percentage": 30.77, "elapsed_time": "0:43:14", "remaining_time": "1:37:16"}
{"current_steps": 325, "total_steps": 1040, "loss": 0.9501, "lr": 2.8894692214279614e-06, "epoch": 0.3125, "percentage": 31.25, "elapsed_time": "0:43:57", "remaining_time": "1:36:43"}
{"current_steps": 330, "total_steps": 1040, "loss": 0.8932, "lr": 2.8479141224897947e-06, "epoch": 0.3173076923076923, "percentage": 31.73, "elapsed_time": "0:44:38", "remaining_time": "1:36:01"}
{"current_steps": 335, "total_steps": 1040, "loss": 0.8509, "lr": 2.806795676441052e-06, "epoch": 0.32211538461538464, "percentage": 32.21, "elapsed_time": "0:45:15", "remaining_time": "1:35:13"}
{"current_steps": 340, "total_steps": 1040, "loss": 0.8531, "lr": 2.7661123430487023e-06, "epoch": 0.3269230769230769, "percentage": 32.69, "elapsed_time": "0:45:56", "remaining_time": "1:34:34"}
{"current_steps": 345, "total_steps": 1040, "loss": 0.8428, "lr": 2.725862576608072e-06, "epoch": 0.3317307692307692, "percentage": 33.17, "elapsed_time": "0:46:34", "remaining_time": "1:33:49"}
{"current_steps": 350, "total_steps": 1040, "loss": 0.9324, "lr": 2.6860448258841182e-06, "epoch": 0.33653846153846156, "percentage": 33.65, "elapsed_time": "0:47:13", "remaining_time": "1:33:06"}
{"current_steps": 355, "total_steps": 1040, "loss": 0.8302, "lr": 2.6466575340516312e-06, "epoch": 0.34134615384615385, "percentage": 34.13, "elapsed_time": "0:47:48", "remaining_time": "1:32:15"}
{"current_steps": 360, "total_steps": 1040, "loss": 1.0338, "lr": 2.607699138634365e-06, "epoch": 0.34615384615384615, "percentage": 34.62, "elapsed_time": "0:48:34", "remaining_time": "1:31:45"}
{"current_steps": 365, "total_steps": 1040, "loss": 0.781, "lr": 2.5691680714430463e-06, "epoch": 0.35096153846153844, "percentage": 35.1, "elapsed_time": "0:49:06", "remaining_time": "1:30:49"}
{"current_steps": 370, "total_steps": 1040, "loss": 0.9277, "lr": 2.531062758512248e-06, "epoch": 0.3557692307692308, "percentage": 35.58, "elapsed_time": "0:49:45", "remaining_time": "1:30:06"}
{"current_steps": 375, "total_steps": 1040, "loss": 0.7648, "lr": 2.493381620036082e-06, "epoch": 0.3605769230769231, "percentage": 36.06, "elapsed_time": "0:50:17", "remaining_time": "1:29:10"}
{"current_steps": 380, "total_steps": 1040, "loss": 0.7278, "lr": 2.4561230703027005e-06, "epoch": 0.36538461538461536, "percentage": 36.54, "elapsed_time": "0:50:49", "remaining_time": "1:28:16"}
{"current_steps": 385, "total_steps": 1040, "loss": 0.7564, "lr": 2.4192855176275597e-06, "epoch": 0.3701923076923077, "percentage": 37.02, "elapsed_time": "0:51:24", "remaining_time": "1:27:28"}
{"current_steps": 390, "total_steps": 1040, "loss": 0.7983, "lr": 2.382867364285416e-06, "epoch": 0.375, "percentage": 37.5, "elapsed_time": "0:51:57", "remaining_time": "1:26:36"}
{"current_steps": 395, "total_steps": 1040, "loss": 0.9005, "lr": 2.3468670064410194e-06, "epoch": 0.3798076923076923, "percentage": 37.98, "elapsed_time": "0:52:40", "remaining_time": "1:26:01"}
{"current_steps": 400, "total_steps": 1040, "loss": 0.8669, "lr": 2.3112828340784763e-06, "epoch": 0.38461538461538464, "percentage": 38.46, "elapsed_time": "0:53:18", "remaining_time": "1:25:17"}
{"current_steps": 400, "total_steps": 1040, "eval_loss": 0.9519588351249695, "epoch": 0.38461538461538464, "percentage": 38.46, "elapsed_time": "0:53:39", "remaining_time": "1:25:50"}
{"current_steps": 405, "total_steps": 1040, "loss": 0.8864, "lr": 2.2761132309292435e-06, "epoch": 0.3894230769230769, "percentage": 38.94, "elapsed_time": "0:54:15", "remaining_time": "1:25:04"}
{"current_steps": 410, "total_steps": 1040, "loss": 0.9219, "lr": 2.241356574398701e-06, "epoch": 0.3942307692307692, "percentage": 39.42, "elapsed_time": "0:54:52", "remaining_time": "1:24:19"}
{"current_steps": 415, "total_steps": 1040, "loss": 0.9542, "lr": 2.2070112354912867e-06, "epoch": 0.39903846153846156, "percentage": 39.9, "elapsed_time": "0:55:32", "remaining_time": "1:23:38"}
{"current_steps": 420, "total_steps": 1040, "loss": 0.7828, "lr": 2.1730755787341422e-06, "epoch": 0.40384615384615385, "percentage": 40.38, "elapsed_time": "0:56:12", "remaining_time": "1:22:58"}
{"current_steps": 425, "total_steps": 1040, "loss": 0.9213, "lr": 2.1395479620992237e-06, "epoch": 0.40865384615384615, "percentage": 40.87, "elapsed_time": "0:56:49", "remaining_time": "1:22:14"}
{"current_steps": 430, "total_steps": 1040, "loss": 0.8832, "lr": 2.1064267369238405e-06, "epoch": 0.41346153846153844, "percentage": 41.35, "elapsed_time": "0:57:28", "remaining_time": "1:21:31"}
{"current_steps": 435, "total_steps": 1040, "loss": 1.0524, "lr": 2.0737102478295753e-06, "epoch": 0.4182692307692308, "percentage": 41.83, "elapsed_time": "0:58:13", "remaining_time": "1:20:58"}
{"current_steps": 440, "total_steps": 1040, "loss": 0.8951, "lr": 2.0413968326395454e-06, "epoch": 0.4230769230769231, "percentage": 42.31, "elapsed_time": "0:58:50", "remaining_time": "1:20:14"}
{"current_steps": 445, "total_steps": 1040, "loss": 0.8803, "lr": 2.009484822293941e-06, "epoch": 0.42788461538461536, "percentage": 42.79, "elapsed_time": "0:59:27", "remaining_time": "1:19:30"}
{"current_steps": 450, "total_steps": 1040, "loss": 0.8575, "lr": 1.9779725407638038e-06, "epoch": 0.4326923076923077, "percentage": 43.27, "elapsed_time": "1:00:01", "remaining_time": "1:18:42"}
{"current_steps": 455, "total_steps": 1040, "loss": 0.874, "lr": 1.946858304962993e-06, "epoch": 0.4375, "percentage": 43.75, "elapsed_time": "1:00:35", "remaining_time": "1:17:54"}
{"current_steps": 460, "total_steps": 1040, "loss": 1.0103, "lr": 1.9161404246582834e-06, "epoch": 0.4423076923076923, "percentage": 44.23, "elapsed_time": "1:01:18", "remaining_time": "1:17:18"}
{"current_steps": 465, "total_steps": 1040, "loss": 0.8943, "lr": 1.8858172023775289e-06, "epoch": 0.44711538461538464, "percentage": 44.71, "elapsed_time": "1:02:01", "remaining_time": "1:16:41"}
{"current_steps": 470, "total_steps": 1040, "loss": 0.9638, "lr": 1.8558869333158512e-06, "epoch": 0.4519230769230769, "percentage": 45.19, "elapsed_time": "1:02:40", "remaining_time": "1:16:00"}
{"current_steps": 475, "total_steps": 1040, "loss": 0.8781, "lr": 1.8263479052397838e-06, "epoch": 0.4567307692307692, "percentage": 45.67, "elapsed_time": "1:03:18", "remaining_time": "1:15:18"}
{"current_steps": 480, "total_steps": 1040, "loss": 0.8883, "lr": 1.7971983983893046e-06, "epoch": 0.46153846153846156, "percentage": 46.15, "elapsed_time": "1:04:03", "remaining_time": "1:14:43"}
{"current_steps": 480, "total_steps": 1040, "eval_loss": 0.9505824446678162, "epoch": 0.46153846153846156, "percentage": 46.15, "elapsed_time": "1:04:23", "remaining_time": "1:15:07"}
{"current_steps": 485, "total_steps": 1040, "loss": 0.7087, "lr": 1.768436685377699e-06, "epoch": 0.46634615384615385, "percentage": 46.63, "elapsed_time": "1:05:01", "remaining_time": "1:14:24"}
{"current_steps": 490, "total_steps": 1040, "loss": 0.928, "lr": 1.7400610310891816e-06, "epoch": 0.47115384615384615, "percentage": 47.12, "elapsed_time": "1:05:47", "remaining_time": "1:13:51"}
{"current_steps": 495, "total_steps": 1040, "loss": 0.8047, "lr": 1.7120696925742107e-06, "epoch": 0.47596153846153844, "percentage": 47.6, "elapsed_time": "1:06:35", "remaining_time": "1:13:18"}
{"current_steps": 500, "total_steps": 1040, "loss": 1.0923, "lr": 1.6844609189424112e-06, "epoch": 0.4807692307692308, "percentage": 48.08, "elapsed_time": "1:07:18", "remaining_time": "1:12:41"}
{"current_steps": 505, "total_steps": 1040, "loss": 0.7718, "lr": 1.6572329512530394e-06, "epoch": 0.4855769230769231, "percentage": 48.56, "elapsed_time": "1:07:54", "remaining_time": "1:11:56"}
{"current_steps": 510, "total_steps": 1040, "loss": 0.7462, "lr": 1.630384022402907e-06, "epoch": 0.49038461538461536, "percentage": 49.04, "elapsed_time": "1:08:31", "remaining_time": "1:11:12"}
{"current_steps": 515, "total_steps": 1040, "loss": 0.965, "lr": 1.6039123570116796e-06, "epoch": 0.4951923076923077, "percentage": 49.52, "elapsed_time": "1:09:13", "remaining_time": "1:10:34"}
{"current_steps": 520, "total_steps": 1040, "loss": 0.8943, "lr": 1.5778161713044614e-06, "epoch": 0.5, "percentage": 50.0, "elapsed_time": "1:09:52", "remaining_time": "1:09:52"}
{"current_steps": 525, "total_steps": 1040, "loss": 0.9694, "lr": 1.5520936729915777e-06, "epoch": 0.5048076923076923, "percentage": 50.48, "elapsed_time": "1:10:36", "remaining_time": "1:09:16"}
{"current_steps": 530, "total_steps": 1040, "loss": 0.8589, "lr": 1.5267430611454654e-06, "epoch": 0.5096153846153846, "percentage": 50.96, "elapsed_time": "1:11:12", "remaining_time": "1:08:31"}
{"current_steps": 535, "total_steps": 1040, "loss": 0.8761, "lr": 1.5017625260745615e-06, "epoch": 0.5144230769230769, "percentage": 51.44, "elapsed_time": "1:11:53", "remaining_time": "1:07:51"}
{"current_steps": 540, "total_steps": 1040, "loss": 0.9293, "lr": 1.4771502491940911e-06, "epoch": 0.5192307692307693, "percentage": 51.92, "elapsed_time": "1:12:34", "remaining_time": "1:07:12"}
{"current_steps": 545, "total_steps": 1040, "loss": 0.7738, "lr": 1.4529044028936606e-06, "epoch": 0.5240384615384616, "percentage": 52.4, "elapsed_time": "1:13:12", "remaining_time": "1:06:29"}
{"current_steps": 550, "total_steps": 1040, "loss": 0.8173, "lr": 1.4290231504015187e-06, "epoch": 0.5288461538461539, "percentage": 52.88, "elapsed_time": "1:13:46", "remaining_time": "1:05:43"}
{"current_steps": 555, "total_steps": 1040, "loss": 1.0166, "lr": 1.4055046456453867e-06, "epoch": 0.5336538461538461, "percentage": 53.37, "elapsed_time": "1:14:29", "remaining_time": "1:05:05"}
{"current_steps": 560, "total_steps": 1040, "loss": 0.7636, "lr": 1.3823470331097324e-06, "epoch": 0.5384615384615384, "percentage": 53.85, "elapsed_time": "1:15:06", "remaining_time": "1:04:22"}
{"current_steps": 560, "total_steps": 1040, "eval_loss": 0.9441266059875488, "epoch": 0.5384615384615384, "percentage": 53.85, "elapsed_time": "1:15:27", "remaining_time": "1:04:40"}
{"current_steps": 565, "total_steps": 1040, "loss": 0.9229, "lr": 1.3595484476893454e-06, "epoch": 0.5432692307692307, "percentage": 54.33, "elapsed_time": "1:16:04", "remaining_time": "1:03:57"}
{"current_steps": 570, "total_steps": 1040, "loss": 0.8806, "lr": 1.3371070145391023e-06, "epoch": 0.5480769230769231, "percentage": 54.81, "elapsed_time": "1:16:47", "remaining_time": "1:03:18"}
{"current_steps": 575, "total_steps": 1040, "loss": 0.7314, "lr": 1.3150208489197545e-06, "epoch": 0.5528846153846154, "percentage": 55.29, "elapsed_time": "1:17:24", "remaining_time": "1:02:36"}
{"current_steps": 580, "total_steps": 1040, "loss": 0.819, "lr": 1.2932880560396128e-06, "epoch": 0.5576923076923077, "percentage": 55.77, "elapsed_time": "1:18:10", "remaining_time": "1:02:00"}
{"current_steps": 585, "total_steps": 1040, "loss": 0.7222, "lr": 1.2719067308919584e-06, "epoch": 0.5625, "percentage": 56.25, "elapsed_time": "1:18:42", "remaining_time": "1:01:13"}
{"current_steps": 590, "total_steps": 1040, "loss": 0.8022, "lr": 1.2508749580880287e-06, "epoch": 0.5673076923076923, "percentage": 56.73, "elapsed_time": "1:19:19", "remaining_time": "1:00:30"}
{"current_steps": 595, "total_steps": 1040, "loss": 0.884, "lr": 1.2301908116853925e-06, "epoch": 0.5721153846153846, "percentage": 57.21, "elapsed_time": "1:19:57", "remaining_time": "0:59:48"}
{"current_steps": 600, "total_steps": 1040, "loss": 1.0023, "lr": 1.2098523550115558e-06, "epoch": 0.5769230769230769, "percentage": 57.69, "elapsed_time": "1:20:46", "remaining_time": "0:59:14"}
{"current_steps": 605, "total_steps": 1040, "loss": 0.9518, "lr": 1.189857640482588e-06, "epoch": 0.5817307692307693, "percentage": 58.17, "elapsed_time": "1:21:28", "remaining_time": "0:58:35"}
{"current_steps": 610, "total_steps": 1040, "loss": 0.8211, "lr": 1.170204709416585e-06, "epoch": 0.5865384615384616, "percentage": 58.65, "elapsed_time": "1:22:04", "remaining_time": "0:57:51"}
{"current_steps": 615, "total_steps": 1040, "loss": 0.7398, "lr": 1.1508915918417567e-06, "epoch": 0.5913461538461539, "percentage": 59.13, "elapsed_time": "1:22:43", "remaining_time": "0:57:09"}
{"current_steps": 620, "total_steps": 1040, "loss": 0.941, "lr": 1.1319163062989139e-06, "epoch": 0.5961538461538461, "percentage": 59.62, "elapsed_time": "1:23:25", "remaining_time": "0:56:30"}
{"current_steps": 625, "total_steps": 1040, "loss": 0.815, "lr": 1.1132768596381337e-06, "epoch": 0.6009615384615384, "percentage": 60.1, "elapsed_time": "1:23:58", "remaining_time": "0:55:45"}
{"current_steps": 630, "total_steps": 1040, "loss": 0.8991, "lr": 1.0949712468093497e-06, "epoch": 0.6057692307692307, "percentage": 60.58, "elapsed_time": "1:24:42", "remaining_time": "0:55:07"}
{"current_steps": 635, "total_steps": 1040, "loss": 0.9282, "lr": 1.076997450646619e-06, "epoch": 0.6105769230769231, "percentage": 61.06, "elapsed_time": "1:25:28", "remaining_time": "0:54:31"}
{"current_steps": 640, "total_steps": 1040, "loss": 0.8221, "lr": 1.0593534416457847e-06, "epoch": 0.6153846153846154, "percentage": 61.54, "elapsed_time": "1:26:06", "remaining_time": "0:53:49"}
{"current_steps": 640, "total_steps": 1040, "eval_loss": 0.9404194355010986, "epoch": 0.6153846153846154, "percentage": 61.54, "elapsed_time": "1:26:27", "remaining_time": "0:54:02"}
{"current_steps": 645, "total_steps": 1040, "loss": 0.8804, "lr": 1.0420371777352623e-06, "epoch": 0.6201923076923077, "percentage": 62.02, "elapsed_time": "1:27:06", "remaining_time": "0:53:20"}
{"current_steps": 650, "total_steps": 1040, "loss": 0.7947, "lr": 1.0250466040396306e-06, "epoch": 0.625, "percentage": 62.5, "elapsed_time": "1:27:45", "remaining_time": "0:52:39"}
{"current_steps": 655, "total_steps": 1040, "loss": 0.8485, "lr": 1.0083796526357243e-06, "epoch": 0.6298076923076923, "percentage": 62.98, "elapsed_time": "1:28:19", "remaining_time": "0:51:54"}
{"current_steps": 660, "total_steps": 1040, "loss": 0.7737, "lr": 9.920342423008766e-07, "epoch": 0.6346153846153846, "percentage": 63.46, "elapsed_time": "1:29:03", "remaining_time": "0:51:16"}
{"current_steps": 665, "total_steps": 1040, "loss": 0.8044, "lr": 9.760082782529624e-07, "epoch": 0.6394230769230769, "percentage": 63.94, "elapsed_time": "1:29:40", "remaining_time": "0:50:34"}
{"current_steps": 670, "total_steps": 1040, "loss": 0.8059, "lr": 9.602996518818617e-07, "epoch": 0.6442307692307693, "percentage": 64.42, "elapsed_time": "1:30:18", "remaining_time": "0:49:52"}
{"current_steps": 675, "total_steps": 1040, "loss": 0.9736, "lr": 9.449062404719376e-07, "epoch": 0.6490384615384616, "percentage": 64.9, "elapsed_time": "1:31:07", "remaining_time": "0:49:16"}
{"current_steps": 680, "total_steps": 1040, "loss": 0.8253, "lr": 9.298259069151074e-07, "epoch": 0.6538461538461539, "percentage": 65.38, "elapsed_time": "1:31:48", "remaining_time": "0:48:36"}
{"current_steps": 685, "total_steps": 1040, "loss": 1.0807, "lr": 9.15056499414049e-07, "epoch": 0.6586538461538461, "percentage": 65.87, "elapsed_time": "1:32:43", "remaining_time": "0:48:03"}
{"current_steps": 690, "total_steps": 1040, "loss": 0.8206, "lr": 9.005958511750684e-07, "epoch": 0.6634615384615384, "percentage": 66.35, "elapsed_time": "1:33:21", "remaining_time": "0:47:21"}
{"current_steps": 695, "total_steps": 1040, "loss": 0.9496, "lr": 8.864417800901062e-07, "epoch": 0.6682692307692307, "percentage": 66.83, "elapsed_time": "1:34:06", "remaining_time": "0:46:42"}
{"current_steps": 700, "total_steps": 1040, "loss": 0.9023, "lr": 8.72592088407351e-07, "epoch": 0.6730769230769231, "percentage": 67.31, "elapsed_time": "1:34:48", "remaining_time": "0:46:03"}
{"current_steps": 705, "total_steps": 1040, "loss": 0.869, "lr": 8.590445623898662e-07, "epoch": 0.6778846153846154, "percentage": 67.79, "elapsed_time": "1:35:30", "remaining_time": "0:45:22"}
{"current_steps": 710, "total_steps": 1040, "loss": 0.9186, "lr": 8.457969719616223e-07, "epoch": 0.6826923076923077, "percentage": 68.27, "elapsed_time": "1:36:13", "remaining_time": "0:44:43"}
{"current_steps": 715, "total_steps": 1040, "loss": 0.9203, "lr": 8.32847070340265e-07, "epoch": 0.6875, "percentage": 68.75, "elapsed_time": "1:36:54", "remaining_time": "0:44:02"}
{"current_steps": 720, "total_steps": 1040, "loss": 0.9417, "lr": 8.201925936559198e-07, "epoch": 0.6923076923076923, "percentage": 69.23, "elapsed_time": "1:37:39", "remaining_time": "0:43:24"}
{"current_steps": 720, "total_steps": 1040, "eval_loss": 0.9345305562019348, "epoch": 0.6923076923076923, "percentage": 69.23, "elapsed_time": "1:38:00", "remaining_time": "0:43:33"}
{"current_steps": 725, "total_steps": 1040, "loss": 0.9107, "lr": 8.078312605552745e-07, "epoch": 0.6971153846153846, "percentage": 69.71, "elapsed_time": "1:38:54", "remaining_time": "0:42:58"}
{"current_steps": 730, "total_steps": 1040, "loss": 0.9438, "lr": 7.957607717901299e-07, "epoch": 0.7019230769230769, "percentage": 70.19, "elapsed_time": "1:39:42", "remaining_time": "0:42:20"}
{"current_steps": 735, "total_steps": 1040, "loss": 0.8693, "lr": 7.839788097895564e-07, "epoch": 0.7067307692307693, "percentage": 70.67, "elapsed_time": "1:40:18", "remaining_time": "0:41:37"}
{"current_steps": 740, "total_steps": 1040, "loss": 0.896, "lr": 7.72483038214722e-07, "epoch": 0.7115384615384616, "percentage": 71.15, "elapsed_time": "1:41:05", "remaining_time": "0:40:58"}
{"current_steps": 745, "total_steps": 1040, "loss": 0.8243, "lr": 7.612711014953991e-07, "epoch": 0.7163461538461539, "percentage": 71.63, "elapsed_time": "1:41:40", "remaining_time": "0:40:15"}
{"current_steps": 750, "total_steps": 1040, "loss": 1.0063, "lr": 7.503406243470673e-07, "epoch": 0.7211538461538461, "percentage": 72.12, "elapsed_time": "1:42:29", "remaining_time": "0:39:37"}
{"current_steps": 755, "total_steps": 1040, "loss": 0.8133, "lr": 7.396892112674676e-07, "epoch": 0.7259615384615384, "percentage": 72.6, "elapsed_time": "1:43:13", "remaining_time": "0:38:58"}
{"current_steps": 760, "total_steps": 1040, "loss": 0.8753, "lr": 7.293144460113513e-07, "epoch": 0.7307692307692307, "percentage": 73.08, "elapsed_time": "1:43:56", "remaining_time": "0:38:17"}
{"current_steps": 765, "total_steps": 1040, "loss": 0.8277, "lr": 7.192138910420856e-07, "epoch": 0.7355769230769231, "percentage": 73.56, "elapsed_time": "1:44:43", "remaining_time": "0:37:38"}
{"current_steps": 770, "total_steps": 1040, "loss": 0.8746, "lr": 7.093850869586572e-07, "epoch": 0.7403846153846154, "percentage": 74.04, "elapsed_time": "1:45:31", "remaining_time": "0:37:00"}
{"current_steps": 775, "total_steps": 1040, "loss": 0.8711, "lr": 6.998255518965055e-07, "epoch": 0.7451923076923077, "percentage": 74.52, "elapsed_time": "1:46:16", "remaining_time": "0:36:20"}
{"current_steps": 780, "total_steps": 1040, "loss": 0.8073, "lr": 6.905327809004765e-07, "epoch": 0.75, "percentage": 75.0, "elapsed_time": "1:47:05", "remaining_time": "0:35:41"}
{"current_steps": 785, "total_steps": 1040, "loss": 0.852, "lr": 6.815042452680482e-07, "epoch": 0.7548076923076923, "percentage": 75.48, "elapsed_time": "1:47:48", "remaining_time": "0:35:01"}
{"current_steps": 790, "total_steps": 1040, "loss": 0.7941, "lr": 6.727373918608166e-07, "epoch": 0.7596153846153846, "percentage": 75.96, "elapsed_time": "1:48:26", "remaining_time": "0:34:18"}
{"current_steps": 795, "total_steps": 1040, "loss": 0.8553, "lr": 6.642296423820508e-07, "epoch": 0.7644230769230769, "percentage": 76.44, "elapsed_time": "1:49:03", "remaining_time": "0:33:36"}
{"current_steps": 800, "total_steps": 1040, "loss": 0.9623, "lr": 6.559783926179307e-07, "epoch": 0.7692307692307693, "percentage": 76.92, "elapsed_time": "1:49:56", "remaining_time": "0:32:58"}
{"current_steps": 800, "total_steps": 1040, "eval_loss": 0.9317355155944824, "epoch": 0.7692307692307693, "percentage": 76.92, "elapsed_time": "1:50:17", "remaining_time": "0:33:05"}
{"current_steps": 805, "total_steps": 1040, "loss": 0.9048, "lr": 6.479810116398562e-07, "epoch": 0.7740384615384616, "percentage": 77.4, "elapsed_time": "1:50:55", "remaining_time": "0:32:22"}
{"current_steps": 810, "total_steps": 1040, "loss": 0.7535, "lr": 6.40234840964976e-07, "epoch": 0.7788461538461539, "percentage": 77.88, "elapsed_time": "1:51:40", "remaining_time": "0:31:42"}
{"current_steps": 815, "total_steps": 1040, "loss": 0.8606, "lr": 6.327371936718024e-07, "epoch": 0.7836538461538461, "percentage": 78.37, "elapsed_time": "1:52:24", "remaining_time": "0:31:02"}
{"current_steps": 820, "total_steps": 1040, "loss": 0.8133, "lr": 6.254853534674779e-07, "epoch": 0.7884615384615384, "percentage": 78.85, "elapsed_time": "1:53:07", "remaining_time": "0:30:20"}
{"current_steps": 825, "total_steps": 1040, "loss": 0.921, "lr": 6.184765737029068e-07, "epoch": 0.7932692307692307, "percentage": 79.33, "elapsed_time": "1:54:14", "remaining_time": "0:29:46"}
{"current_steps": 830, "total_steps": 1040, "loss": 0.8378, "lr": 6.117080763315794e-07, "epoch": 0.7980769230769231, "percentage": 79.81, "elapsed_time": "1:55:00", "remaining_time": "0:29:05"}
{"current_steps": 835, "total_steps": 1040, "loss": 0.7412, "lr": 6.051770508074766e-07, "epoch": 0.8028846153846154, "percentage": 80.29, "elapsed_time": "1:55:35", "remaining_time": "0:28:22"}
{"current_steps": 840, "total_steps": 1040, "loss": 0.8488, "lr": 5.98880652916942e-07, "epoch": 0.8076923076923077, "percentage": 80.77, "elapsed_time": "1:56:16", "remaining_time": "0:27:41"}
{"current_steps": 845, "total_steps": 1040, "loss": 0.7888, "lr": 5.928160035388477e-07, "epoch": 0.8125, "percentage": 81.25, "elapsed_time": "1:57:07", "remaining_time": "0:27:01"}
{"current_steps": 850, "total_steps": 1040, "loss": 0.9896, "lr": 5.869801873267336e-07, "epoch": 0.8173076923076923, "percentage": 81.73, "elapsed_time": "1:57:47", "remaining_time": "0:26:19"}
{"current_steps": 855, "total_steps": 1040, "loss": 0.7731, "lr": 5.813702513058679e-07, "epoch": 0.8221153846153846, "percentage": 82.21, "elapsed_time": "1:58:25", "remaining_time": "0:25:37"}
{"current_steps": 860, "total_steps": 1040, "loss": 0.9015, "lr": 5.759832033773325e-07, "epoch": 0.8269230769230769, "percentage": 82.69, "elapsed_time": "1:59:12", "remaining_time": "0:24:56"}
{"current_steps": 865, "total_steps": 1040, "loss": 0.8423, "lr": 5.708160107202719e-07, "epoch": 0.8317307692307693, "percentage": 83.17, "elapsed_time": "1:59:49", "remaining_time": "0:24:14"}
{"current_steps": 870, "total_steps": 1040, "loss": 0.8807, "lr": 5.658655980823239e-07, "epoch": 0.8365384615384616, "percentage": 83.65, "elapsed_time": "2:00:32", "remaining_time": "0:23:33"}
{"current_steps": 875, "total_steps": 1040, "loss": 0.8609, "lr": 5.611288459469594e-07, "epoch": 0.8413461538461539, "percentage": 84.13, "elapsed_time": "2:01:12", "remaining_time": "0:22:51"}
{"current_steps": 880, "total_steps": 1040, "loss": 0.9654, "lr": 5.566025885649524e-07, "epoch": 0.8461538461538461, "percentage": 84.62, "elapsed_time": "2:01:53", "remaining_time": "0:22:09"}
{"current_steps": 880, "total_steps": 1040, "eval_loss": 0.9302033185958862, "epoch": 0.8461538461538461, "percentage": 84.62, "elapsed_time": "2:02:14", "remaining_time": "0:22:13"}
{"current_steps": 885, "total_steps": 1040, "loss": 0.7406, "lr": 5.522836118354419e-07, "epoch": 0.8509615384615384, "percentage": 85.1, "elapsed_time": "2:03:05", "remaining_time": "0:21:33"}
{"current_steps": 890, "total_steps": 1040, "loss": 0.9893, "lr": 5.481686510199858e-07, "epoch": 0.8557692307692307, "percentage": 85.58, "elapsed_time": "2:03:55", "remaining_time": "0:20:53"}
{"current_steps": 895, "total_steps": 1040, "loss": 0.9432, "lr": 5.442543882705713e-07, "epoch": 0.8605769230769231, "percentage": 86.06, "elapsed_time": "2:04:54", "remaining_time": "0:20:14"}
{"current_steps": 900, "total_steps": 1040, "loss": 0.8199, "lr": 5.405374499496658e-07, "epoch": 0.8653846153846154, "percentage": 86.54, "elapsed_time": "2:05:42", "remaining_time": "0:19:33"}
{"current_steps": 905, "total_steps": 1040, "loss": 0.8742, "lr": 5.370144037169503e-07, "epoch": 0.8701923076923077, "percentage": 87.02, "elapsed_time": "2:06:31", "remaining_time": "0:18:52"}
{"current_steps": 910, "total_steps": 1040, "loss": 0.8431, "lr": 5.336817553532644e-07, "epoch": 0.875, "percentage": 87.5, "elapsed_time": "2:07:19", "remaining_time": "0:18:11"}
{"current_steps": 915, "total_steps": 1040, "loss": 0.8947, "lr": 5.305359452873153e-07, "epoch": 0.8798076923076923, "percentage": 87.98, "elapsed_time": "2:08:07", "remaining_time": "0:17:30"}
{"current_steps": 920, "total_steps": 1040, "loss": 0.7263, "lr": 5.275733447846792e-07, "epoch": 0.8846153846153846, "percentage": 88.46, "elapsed_time": "2:08:49", "remaining_time": "0:16:48"}
{"current_steps": 925, "total_steps": 1040, "loss": 0.8365, "lr": 5.247902517512378e-07, "epoch": 0.8894230769230769, "percentage": 88.94, "elapsed_time": "2:09:34", "remaining_time": "0:16:06"}
{"current_steps": 930, "total_steps": 1040, "loss": 1.0223, "lr": 5.221828860941111e-07, "epoch": 0.8942307692307693, "percentage": 89.42, "elapsed_time": "2:10:21", "remaining_time": "0:15:25"}
{"current_steps": 935, "total_steps": 1040, "loss": 0.8666, "lr": 5.197473845718411e-07, "epoch": 0.8990384615384616, "percentage": 89.9, "elapsed_time": "2:11:06", "remaining_time": "0:14:43"}
{"current_steps": 940, "total_steps": 1040, "loss": 0.7097, "lr": 5.174797950514308e-07, "epoch": 0.9038461538461539, "percentage": 90.38, "elapsed_time": "2:11:43", "remaining_time": "0:14:00"}
{"current_steps": 945, "total_steps": 1040, "loss": 0.9475, "lr": 5.153760700719024e-07, "epoch": 0.9086538461538461, "percentage": 90.87, "elapsed_time": "2:12:31", "remaining_time": "0:13:19"}
{"current_steps": 950, "total_steps": 1040, "loss": 0.8123, "lr": 5.13432059591097e-07, "epoch": 0.9134615384615384, "percentage": 91.35, "elapsed_time": "2:13:09", "remaining_time": "0:12:36"}
{"current_steps": 955, "total_steps": 1040, "loss": 0.8134, "lr": 5.116435027627297e-07, "epoch": 0.9182692307692307, "percentage": 91.83, "elapsed_time": "2:13:52", "remaining_time": "0:11:54"}
{"current_steps": 960, "total_steps": 1040, "loss": 0.9169, "lr": 5.100060185517474e-07, "epoch": 0.9230769230769231, "percentage": 92.31, "elapsed_time": "2:14:49", "remaining_time": "0:11:14"}
{"current_steps": 960, "total_steps": 1040, "eval_loss": 0.928638756275177, "epoch": 0.9230769230769231, "percentage": 92.31, "elapsed_time": "2:15:10", "remaining_time": "0:11:15"}
{"current_steps": 965, "total_steps": 1040, "loss": 0.7718, "lr": 5.085150949442101e-07, "epoch": 0.9278846153846154, "percentage": 92.79, "elapsed_time": "2:15:56", "remaining_time": "0:10:33"}
{"current_steps": 970, "total_steps": 1040, "loss": 0.9096, "lr": 5.071660764378547e-07, "epoch": 0.9326923076923077, "percentage": 93.27, "elapsed_time": "2:17:03", "remaining_time": "0:09:53"}
{"current_steps": 975, "total_steps": 1040, "loss": 0.8835, "lr": 5.059541494031398e-07, "epoch": 0.9375, "percentage": 93.75, "elapsed_time": "2:18:04", "remaining_time": "0:09:12"}
{"current_steps": 980, "total_steps": 1040, "loss": 0.8909, "lr": 5.048743247693103e-07, "epoch": 0.9423076923076923, "percentage": 94.23, "elapsed_time": "2:19:26", "remaining_time": "0:08:32"}
{"current_steps": 985, "total_steps": 1040, "loss": 0.8688, "lr": 5.039214172958587e-07, "epoch": 0.9471153846153846, "percentage": 94.71, "elapsed_time": "2:20:16", "remaining_time": "0:07:49"}
{"current_steps": 990, "total_steps": 1040, "loss": 0.8714, "lr": 5.030900204036544e-07, "epoch": 0.9519230769230769, "percentage": 95.19, "elapsed_time": "2:21:02", "remaining_time": "0:07:07"}
{"current_steps": 995, "total_steps": 1040, "loss": 0.9248, "lr": 5.023744751055416e-07, "epoch": 0.9567307692307693, "percentage": 95.67, "elapsed_time": "2:22:03", "remaining_time": "0:06:25"}
{"current_steps": 1000, "total_steps": 1040, "loss": 0.8965, "lr": 5.017688308926548e-07, "epoch": 0.9615384615384616, "percentage": 96.15, "elapsed_time": "2:23:03", "remaining_time": "0:05:43"}
{"current_steps": 1005, "total_steps": 1040, "loss": 0.8606, "lr": 5.012667953109271e-07, "epoch": 0.9663461538461539, "percentage": 96.63, "elapsed_time": "2:23:49", "remaining_time": "0:05:00"}
{"current_steps": 1010, "total_steps": 1040, "loss": 0.8847, "lr": 5.008616670245212e-07, "epoch": 0.9711538461538461, "percentage": 97.12, "elapsed_time": "2:25:12", "remaining_time": "0:04:18"}
{"current_steps": 1015, "total_steps": 1040, "loss": 0.7237, "lr": 5.005462435953572e-07, "epoch": 0.9759615384615384, "percentage": 97.6, "elapsed_time": "2:25:58", "remaining_time": "0:03:35"}
{"current_steps": 1020, "total_steps": 1040, "loss": 0.9875, "lr": 5.003126880797421e-07, "epoch": 0.9807692307692307, "percentage": 98.08, "elapsed_time": "2:27:13", "remaining_time": "0:02:53"}
{"current_steps": 1025, "total_steps": 1040, "loss": 0.8558, "lr": 5.00152322649041e-07, "epoch": 0.9855769230769231, "percentage": 98.56, "elapsed_time": "2:28:16", "remaining_time": "0:02:10"}
{"current_steps": 1030, "total_steps": 1040, "loss": 0.6462, "lr": 5.000552759653955e-07, "epoch": 0.9903846153846154, "percentage": 99.04, "elapsed_time": "2:29:20", "remaining_time": "0:01:26"}
{"current_steps": 1035, "total_steps": 1040, "loss": 0.7703, "lr": 5.000097715024919e-07, "epoch": 0.9951923076923077, "percentage": 99.52, "elapsed_time": "2:30:14", "remaining_time": "0:00:43"}
{"current_steps": 1040, "total_steps": 1040, "loss": 0.9005, "lr": 5e-07, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "2:31:17", "remaining_time": "0:00:00"}
{"current_steps": 1040, "total_steps": 1040, "eval_loss": 0.9287646412849426, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "2:31:39", "remaining_time": "0:00:00"}
{"current_steps": 1040, "total_steps": 1040, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "2:32:36", "remaining_time": "0:00:00"}