{"current_steps": 100, "total_steps": 93654, "loss": 1.2173, "learning_rate": 5e-06, "epoch": 0.003203280158882696, "percentage": 0.11, "elapsed_time": "0:18:27", "remaining_time": "11 days, 23:56:07", "throughput": 739.36, "total_tokens": 819200} {"current_steps": 200, "total_steps": 93654, "loss": 1.1953, "learning_rate": 1e-05, "epoch": 0.006406560317765392, "percentage": 0.21, "elapsed_time": "0:32:00", "remaining_time": "10 days, 9:15:33", "throughput": 853.17, "total_tokens": 1638400} {"current_steps": 300, "total_steps": 93654, "loss": 1.1905, "learning_rate": 1.5e-05, "epoch": 0.009609840476648087, "percentage": 0.32, "elapsed_time": "0:41:39", "remaining_time": "9 days, 0:02:41", "throughput": 983.28, "total_tokens": 2457600} {"current_steps": 400, "total_steps": 93654, "loss": 1.1391, "learning_rate": 2e-05, "epoch": 0.012813120635530783, "percentage": 0.43, "elapsed_time": "0:52:20", "remaining_time": "8 days, 11:23:31", "throughput": 1043.33, "total_tokens": 3276800} {"current_steps": 500, "total_steps": 93654, "loss": 1.1383, "learning_rate": 2.5e-05, "epoch": 0.01601640079441348, "percentage": 0.53, "elapsed_time": "1:12:06", "remaining_time": "9 days, 7:54:49", "throughput": 946.69, "total_tokens": 4096000} {"current_steps": 600, "total_steps": 93654, "loss": 1.1022, "learning_rate": 3e-05, "epoch": 0.019219680953296174, "percentage": 0.64, "elapsed_time": "1:21:08", "remaining_time": "8 days, 17:44:45", "throughput": 1009.55, "total_tokens": 4915200} {"current_steps": 700, "total_steps": 93654, "loss": 1.0805, "learning_rate": 3.5e-05, "epoch": 0.022422961112178872, "percentage": 0.75, "elapsed_time": "1:30:09", "remaining_time": "8 days, 7:31:52", "throughput": 1060.09, "total_tokens": 5734400} {"current_steps": 800, "total_steps": 93654, "loss": 1.0755, "learning_rate": 4e-05, "epoch": 0.025626241271061567, "percentage": 0.85, "elapsed_time": "1:39:08", "remaining_time": "7 days, 23:46:42", "throughput": 1101.76, "total_tokens": 6553600} {"current_steps": 900, "total_steps": 93654, "loss": 1.0995, "learning_rate": 4.5e-05, "epoch": 0.028829521429944265, "percentage": 0.96, "elapsed_time": "1:47:35", "remaining_time": "7 days, 16:48:24", "throughput": 1142.09, "total_tokens": 7372800} {"current_steps": 1000, "total_steps": 93654, "loss": 1.0835, "learning_rate": 5e-05, "epoch": 0.03203280158882696, "percentage": 1.07, "elapsed_time": "1:55:52", "remaining_time": "7 days, 10:56:47", "throughput": 1178.23, "total_tokens": 8192000} {"current_steps": 1100, "total_steps": 93654, "loss": 1.0848, "learning_rate": 4.9999856291983216e-05, "epoch": 0.035236081747709654, "percentage": 1.17, "elapsed_time": "2:04:02", "remaining_time": "7 days, 5:56:19", "throughput": 1210.84, "total_tokens": 9011200} {"current_steps": 1200, "total_steps": 93654, "loss": 1.0621, "learning_rate": 4.9999425169585025e-05, "epoch": 0.03843936190659235, "percentage": 1.28, "elapsed_time": "2:11:56", "remaining_time": "7 days, 1:25:52", "throughput": 1241.71, "total_tokens": 9830400} {"current_steps": 1300, "total_steps": 93654, "loss": 1.0774, "learning_rate": 4.999870663776188e-05, "epoch": 0.04164264206547505, "percentage": 1.39, "elapsed_time": "2:19:55", "remaining_time": "6 days, 21:40:13", "throughput": 1268.52, "total_tokens": 10649600} {"current_steps": 1400, "total_steps": 93654, "loss": 1.0204, "learning_rate": 4.99977007047745e-05, "epoch": 0.044845922224357744, "percentage": 1.49, "elapsed_time": "2:27:49", "remaining_time": "6 days, 18:20:34", "throughput": 1293.12, "total_tokens": 11468800} {"current_steps": 1500, "total_steps": 93654, "loss": 1.0509, "learning_rate": 4.999640738218772e-05, "epoch": 0.04804920238324044, "percentage": 1.6, "elapsed_time": "2:35:38", "remaining_time": "6 days, 15:22:26", "throughput": 1315.78, "total_tokens": 12288000} {"current_steps": 1600, "total_steps": 93654, "loss": 1.1401, "learning_rate": 4.99948266848704e-05, "epoch": 0.05125248254212313, "percentage": 1.71, "elapsed_time": "2:43:34", "remaining_time": "6 days, 12:51:13", "throughput": 1335.47, "total_tokens": 13107200} {"current_steps": 1700, "total_steps": 93654, "loss": 1.042, "learning_rate": 4.999295863099528e-05, "epoch": 0.05445576270100583, "percentage": 1.82, "elapsed_time": "2:51:18", "remaining_time": "6 days, 10:26:03", "throughput": 1354.92, "total_tokens": 13926400} {"current_steps": 1800, "total_steps": 93654, "loss": 1.1398, "learning_rate": 4.999080324203867e-05, "epoch": 0.05765904285988853, "percentage": 1.92, "elapsed_time": "2:59:05", "remaining_time": "6 days, 8:18:41", "throughput": 1372.31, "total_tokens": 14745600} {"current_steps": 1900, "total_steps": 93654, "loss": 1.0759, "learning_rate": 4.9988360542780333e-05, "epoch": 0.060862323018771224, "percentage": 2.03, "elapsed_time": "3:06:49", "remaining_time": "6 days, 6:22:25", "throughput": 1388.48, "total_tokens": 15564800} {"current_steps": 2000, "total_steps": 93654, "loss": 1.0988, "learning_rate": 4.998563056130308e-05, "epoch": 0.06406560317765392, "percentage": 2.14, "elapsed_time": "3:14:38", "remaining_time": "6 days, 4:39:29", "throughput": 1402.98, "total_tokens": 16384000} {"current_steps": 2100, "total_steps": 93654, "loss": 1.0642, "learning_rate": 4.998261332899255e-05, "epoch": 0.06726888333653662, "percentage": 2.24, "elapsed_time": "3:22:25", "remaining_time": "6 days, 3:05:00", "throughput": 1416.45, "total_tokens": 17203200} {"current_steps": 2200, "total_steps": 93654, "loss": 1.076, "learning_rate": 4.997930888053677e-05, "epoch": 0.07047216349541931, "percentage": 2.35, "elapsed_time": "3:30:17", "remaining_time": "6 days, 1:41:28", "throughput": 1428.42, "total_tokens": 18022400} {"current_steps": 2300, "total_steps": 93654, "loss": 1.0616, "learning_rate": 4.99757172539258e-05, "epoch": 0.07367544365430201, "percentage": 2.46, "elapsed_time": "3:38:08", "remaining_time": "6 days, 0:24:16", "throughput": 1439.57, "total_tokens": 18841600} {"current_steps": 2400, "total_steps": 93654, "loss": 1.0691, "learning_rate": 4.997183849045129e-05, "epoch": 0.0768787238131847, "percentage": 2.56, "elapsed_time": "3:46:00", "remaining_time": "5 days, 23:13:39", "throughput": 1449.81, "total_tokens": 19660800} {"current_steps": 2500, "total_steps": 93654, "loss": 1.0463, "learning_rate": 4.996767263470599e-05, "epoch": 0.0800820039720674, "percentage": 2.67, "elapsed_time": "3:53:52", "remaining_time": "5 days, 22:07:37", "throughput": 1459.44, "total_tokens": 20480000} {"current_steps": 2600, "total_steps": 93654, "loss": 1.0703, "learning_rate": 4.996321973458325e-05, "epoch": 0.0832852841309501, "percentage": 2.78, "elapsed_time": "4:01:46", "remaining_time": "5 days, 21:06:52", "throughput": 1468.3, "total_tokens": 21299200} {"current_steps": 2700, "total_steps": 93654, "loss": 1.0397, "learning_rate": 4.9958479841276446e-05, "epoch": 0.08648856428983279, "percentage": 2.88, "elapsed_time": "4:09:37", "remaining_time": "5 days, 20:09:08", "throughput": 1476.76, "total_tokens": 22118400} {"current_steps": 2800, "total_steps": 93654, "loss": 1.0837, "learning_rate": 4.995345300927845e-05, "epoch": 0.08969184444871549, "percentage": 2.99, "elapsed_time": "4:17:30", "remaining_time": "5 days, 19:15:41", "throughput": 1484.57, "total_tokens": 22937600} {"current_steps": 2900, "total_steps": 93654, "loss": 1.0399, "learning_rate": 4.994813929638096e-05, "epoch": 0.09289512460759818, "percentage": 3.1, "elapsed_time": "4:25:23", "remaining_time": "5 days, 18:25:15", "throughput": 1491.94, "total_tokens": 23756800} {"current_steps": 3000, "total_steps": 93654, "loss": 1.0634, "learning_rate": 4.9942538763673794e-05, "epoch": 0.09609840476648088, "percentage": 3.2, "elapsed_time": "4:33:15", "remaining_time": "5 days, 17:37:32", "throughput": 1498.91, "total_tokens": 24576000} {"current_steps": 3100, "total_steps": 93654, "loss": 1.0472, "learning_rate": 4.993665147554429e-05, "epoch": 0.09930168492536358, "percentage": 3.31, "elapsed_time": "4:41:08", "remaining_time": "5 days, 16:52:39", "throughput": 1505.44, "total_tokens": 25395200} {"current_steps": 3200, "total_steps": 93654, "loss": 1.0774, "learning_rate": 4.9930477499676495e-05, "epoch": 0.10250496508424627, "percentage": 3.42, "elapsed_time": "4:49:00", "remaining_time": "5 days, 16:09:34", "throughput": 1511.71, "total_tokens": 26214400} {"current_steps": 3300, "total_steps": 93654, "loss": 1.0402, "learning_rate": 4.992401690705038e-05, "epoch": 0.10570824524312897, "percentage": 3.52, "elapsed_time": "4:56:54", "remaining_time": "5 days, 15:29:15", "throughput": 1517.52, "total_tokens": 27033600} {"current_steps": 3400, "total_steps": 93654, "loss": 1.0353, "learning_rate": 4.9917269771941056e-05, "epoch": 0.10891152540201166, "percentage": 3.63, "elapsed_time": "5:04:45", "remaining_time": "5 days, 14:50:02", "throughput": 1523.19, "total_tokens": 27852800} {"current_steps": 3500, "total_steps": 93654, "loss": 1.0776, "learning_rate": 4.991023617191792e-05, "epoch": 0.11211480556089436, "percentage": 3.74, "elapsed_time": "5:12:38", "remaining_time": "5 days, 14:13:06", "throughput": 1528.48, "total_tokens": 28672000} {"current_steps": 3600, "total_steps": 93654, "loss": 1.1083, "learning_rate": 4.990291618784377e-05, "epoch": 0.11531808571977706, "percentage": 3.84, "elapsed_time": "5:20:31", "remaining_time": "5 days, 13:38:05", "throughput": 1533.45, "total_tokens": 29491200} {"current_steps": 3700, "total_steps": 93654, "loss": 1.0262, "learning_rate": 4.989530990387381e-05, "epoch": 0.11852136587865975, "percentage": 3.95, "elapsed_time": "5:28:24", "remaining_time": "5 days, 13:04:23", "throughput": 1538.22, "total_tokens": 30310400} {"current_steps": 3800, "total_steps": 93654, "loss": 1.0441, "learning_rate": 4.988741740745477e-05, "epoch": 0.12172464603754245, "percentage": 4.06, "elapsed_time": "5:36:16", "remaining_time": "5 days, 12:31:36", "throughput": 1542.84, "total_tokens": 31129600} {"current_steps": 3900, "total_steps": 93654, "loss": 1.0375, "learning_rate": 4.987923878932386e-05, "epoch": 0.12492792619642513, "percentage": 4.16, "elapsed_time": "5:44:09", "remaining_time": "5 days, 12:00:15", "throughput": 1547.23, "total_tokens": 31948800} {"current_steps": 4000, "total_steps": 93654, "loss": 1.0041, "learning_rate": 4.9870774143507696e-05, "epoch": 0.12813120635530784, "percentage": 4.27, "elapsed_time": "5:52:01", "remaining_time": "5 days, 11:30:10", "throughput": 1551.39, "total_tokens": 32768000} {"current_steps": 4100, "total_steps": 93654, "loss": 1.0798, "learning_rate": 4.98620235673213e-05, "epoch": 0.13133448651419052, "percentage": 4.38, "elapsed_time": "5:59:57", "remaining_time": "5 days, 11:02:16", "throughput": 1555.16, "total_tokens": 33587200} {"current_steps": 4200, "total_steps": 93654, "loss": 1.1014, "learning_rate": 4.9852987161366895e-05, "epoch": 0.13453776667307324, "percentage": 4.48, "elapsed_time": "6:07:53", "remaining_time": "5 days, 10:35:34", "throughput": 1558.72, "total_tokens": 34406400} {"current_steps": 4300, "total_steps": 93654, "loss": 1.0321, "learning_rate": 4.9843665029532796e-05, "epoch": 0.13774104683195593, "percentage": 4.59, "elapsed_time": "6:15:44", "remaining_time": "5 days, 10:07:57", "throughput": 1562.48, "total_tokens": 35225600} {"current_steps": 4400, "total_steps": 93654, "loss": 0.9954, "learning_rate": 4.983405727899221e-05, "epoch": 0.14094432699083861, "percentage": 4.7, "elapsed_time": "6:23:37", "remaining_time": "5 days, 9:41:58", "throughput": 1565.95, "total_tokens": 36044800} {"current_steps": 4500, "total_steps": 93654, "loss": 1.0049, "learning_rate": 4.982416402020201e-05, "epoch": 0.1441476071497213, "percentage": 4.8, "elapsed_time": "6:31:29", "remaining_time": "5 days, 9:16:23", "throughput": 1569.35, "total_tokens": 36864000} {"current_steps": 4600, "total_steps": 93654, "loss": 1.0586, "learning_rate": 4.9813985366901435e-05, "epoch": 0.14735088730860402, "percentage": 4.91, "elapsed_time": "6:39:24", "remaining_time": "5 days, 8:52:15", "throughput": 1572.48, "total_tokens": 37683200} {"current_steps": 4700, "total_steps": 93654, "loss": 1.0949, "learning_rate": 4.980352143611081e-05, "epoch": 0.1505541674674867, "percentage": 5.02, "elapsed_time": "6:47:18", "remaining_time": "5 days, 8:29:01", "throughput": 1575.45, "total_tokens": 38502400} {"current_steps": 4800, "total_steps": 93654, "loss": 1.0374, "learning_rate": 4.979277234813021e-05, "epoch": 0.1537574476263694, "percentage": 5.13, "elapsed_time": "6:55:12", "remaining_time": "5 days, 8:06:10", "throughput": 1578.36, "total_tokens": 39321600} {"current_steps": 4900, "total_steps": 93654, "loss": 1.0195, "learning_rate": 4.978173822653802e-05, "epoch": 0.1569607277852521, "percentage": 5.23, "elapsed_time": "7:03:04", "remaining_time": "5 days, 7:43:05", "throughput": 1581.33, "total_tokens": 40140800} {"current_steps": 5000, "total_steps": 93654, "loss": 1.0661, "learning_rate": 4.9770419198189595e-05, "epoch": 0.1601640079441348, "percentage": 5.34, "elapsed_time": "7:10:55", "remaining_time": "5 days, 7:20:43", "throughput": 1584.17, "total_tokens": 40960000} {"current_steps": 5100, "total_steps": 93654, "loss": 1.0168, "learning_rate": 4.975881539321574e-05, "epoch": 0.16336728810301748, "percentage": 5.45, "elapsed_time": "7:18:49", "remaining_time": "5 days, 6:59:38", "throughput": 1586.76, "total_tokens": 41779200} {"current_steps": 5200, "total_steps": 93654, "loss": 1.0523, "learning_rate": 4.974692694502123e-05, "epoch": 0.1665705682619002, "percentage": 5.55, "elapsed_time": "7:26:42", "remaining_time": "5 days, 6:38:33", "throughput": 1589.37, "total_tokens": 42598400} {"current_steps": 5300, "total_steps": 93654, "loss": 1.0294, "learning_rate": 4.973475399028331e-05, "epoch": 0.16977384842078289, "percentage": 5.66, "elapsed_time": "7:34:35", "remaining_time": "5 days, 6:18:21", "throughput": 1591.8, "total_tokens": 43417600} {"current_steps": 5400, "total_steps": 93654, "loss": 0.9866, "learning_rate": 4.972229666895006e-05, "epoch": 0.17297712857966557, "percentage": 5.77, "elapsed_time": "7:42:26", "remaining_time": "5 days, 5:57:52", "throughput": 1594.31, "total_tokens": 44236800} {"current_steps": 5500, "total_steps": 93654, "loss": 0.99, "learning_rate": 4.970955512423884e-05, "epoch": 0.17618040873854826, "percentage": 5.87, "elapsed_time": "7:50:17", "remaining_time": "5 days, 5:37:55", "throughput": 1596.72, "total_tokens": 45056000} {"current_steps": 5600, "total_steps": 93654, "loss": 1.0292, "learning_rate": 4.969652950263462e-05, "epoch": 0.17938368889743098, "percentage": 5.98, "elapsed_time": "7:58:10", "remaining_time": "5 days, 5:18:39", "throughput": 1599.0, "total_tokens": 45875200} {"current_steps": 5700, "total_steps": 93654, "loss": 1.0712, "learning_rate": 4.96832199538883e-05, "epoch": 0.18258696905631366, "percentage": 6.09, "elapsed_time": "8:06:02", "remaining_time": "5 days, 4:59:59", "throughput": 1601.16, "total_tokens": 46694400} {"current_steps": 5800, "total_steps": 93654, "loss": 1.0279, "learning_rate": 4.966962663101499e-05, "epoch": 0.18579024921519635, "percentage": 6.19, "elapsed_time": "8:13:56", "remaining_time": "5 days, 4:41:49", "throughput": 1603.22, "total_tokens": 47513600} {"current_steps": 5900, "total_steps": 93654, "loss": 1.0448, "learning_rate": 4.965574969029223e-05, "epoch": 0.18899352937407907, "percentage": 6.3, "elapsed_time": "8:21:50", "remaining_time": "5 days, 4:24:03", "throughput": 1605.2, "total_tokens": 48332800} {"current_steps": 6000, "total_steps": 93654, "loss": 1.0492, "learning_rate": 4.9641589291258255e-05, "epoch": 0.19219680953296175, "percentage": 6.41, "elapsed_time": "8:29:42", "remaining_time": "5 days, 4:06:21", "throughput": 1607.19, "total_tokens": 49152000} {"current_steps": 6100, "total_steps": 93654, "loss": 1.0593, "learning_rate": 4.962714559671008e-05, "epoch": 0.19540008969184444, "percentage": 6.51, "elapsed_time": "8:37:36", "remaining_time": "5 days, 3:49:15", "throughput": 1609.05, "total_tokens": 49971200} {"current_steps": 6200, "total_steps": 93654, "loss": 1.0054, "learning_rate": 4.961241877270169e-05, "epoch": 0.19860336985072716, "percentage": 6.62, "elapsed_time": "8:45:27", "remaining_time": "5 days, 3:31:56", "throughput": 1610.97, "total_tokens": 50790400} {"current_steps": 6300, "total_steps": 93654, "loss": 0.9865, "learning_rate": 4.9597408988542096e-05, "epoch": 0.20180665000960984, "percentage": 6.73, "elapsed_time": "8:53:18", "remaining_time": "5 days, 3:14:48", "throughput": 1612.85, "total_tokens": 51609600} {"current_steps": 6400, "total_steps": 93654, "loss": 1.0529, "learning_rate": 4.958211641679339e-05, "epoch": 0.20500993016849253, "percentage": 6.83, "elapsed_time": "9:01:11", "remaining_time": "5 days, 2:58:11", "throughput": 1614.63, "total_tokens": 52428800} {"current_steps": 6500, "total_steps": 93654, "loss": 1.0272, "learning_rate": 4.956654123326881e-05, "epoch": 0.20821321032737522, "percentage": 6.94, "elapsed_time": "9:09:02", "remaining_time": "5 days, 2:41:47", "throughput": 1616.37, "total_tokens": 53248000} {"current_steps": 6600, "total_steps": 93654, "loss": 1.0295, "learning_rate": 4.9550683617030624e-05, "epoch": 0.21141649048625794, "percentage": 7.05, "elapsed_time": "9:16:55", "remaining_time": "5 days, 2:25:43", "throughput": 1618.05, "total_tokens": 54067200} {"current_steps": 6700, "total_steps": 93654, "loss": 0.9849, "learning_rate": 4.9534543750388185e-05, "epoch": 0.21461977064514062, "percentage": 7.15, "elapsed_time": "9:24:46", "remaining_time": "5 days, 2:09:39", "throughput": 1619.74, "total_tokens": 54886400} {"current_steps": 6800, "total_steps": 93654, "loss": 0.9597, "learning_rate": 4.951812181889573e-05, "epoch": 0.2178230508040233, "percentage": 7.26, "elapsed_time": "9:32:37", "remaining_time": "5 days, 1:53:57", "throughput": 1621.35, "total_tokens": 55705600} {"current_steps": 6900, "total_steps": 93654, "loss": 1.0008, "learning_rate": 4.950141801135034e-05, "epoch": 0.22102633096290603, "percentage": 7.37, "elapsed_time": "9:40:29", "remaining_time": "5 days, 1:38:39", "throughput": 1622.88, "total_tokens": 56524800} {"current_steps": 7000, "total_steps": 93654, "loss": 0.9889, "learning_rate": 4.948443251978968e-05, "epoch": 0.2242296111217887, "percentage": 7.47, "elapsed_time": "9:48:22", "remaining_time": "5 days, 1:23:38", "throughput": 1624.35, "total_tokens": 57344000} {"current_steps": 7100, "total_steps": 93654, "loss": 0.9869, "learning_rate": 4.946716553948987e-05, "epoch": 0.2274328912806714, "percentage": 7.58, "elapsed_time": "9:56:16", "remaining_time": "5 days, 1:09:05", "throughput": 1625.72, "total_tokens": 58163200} {"current_steps": 7200, "total_steps": 93654, "loss": 0.9669, "learning_rate": 4.9449617268963164e-05, "epoch": 0.23063617143955412, "percentage": 7.69, "elapsed_time": "10:04:09", "remaining_time": "5 days, 0:54:29", "throughput": 1627.11, "total_tokens": 58982400} {"current_steps": 7300, "total_steps": 93654, "loss": 1.0426, "learning_rate": 4.943178790995576e-05, "epoch": 0.2338394515984368, "percentage": 7.79, "elapsed_time": "10:12:03", "remaining_time": "5 days, 0:40:11", "throughput": 1628.44, "total_tokens": 59801600} {"current_steps": 7400, "total_steps": 93654, "loss": 0.9894, "learning_rate": 4.941367766744539e-05, "epoch": 0.2370427317573195, "percentage": 7.9, "elapsed_time": "10:19:56", "remaining_time": "5 days, 0:25:58", "throughput": 1629.75, "total_tokens": 60620800} {"current_steps": 7500, "total_steps": 93654, "loss": 0.996, "learning_rate": 4.939528674963902e-05, "epoch": 0.24024601191620218, "percentage": 8.01, "elapsed_time": "10:27:48", "remaining_time": "5 days, 0:11:47", "throughput": 1631.06, "total_tokens": 61440000} {"current_steps": 7600, "total_steps": 93654, "loss": 1.0557, "learning_rate": 4.937661536797044e-05, "epoch": 0.2434492920750849, "percentage": 8.11, "elapsed_time": "10:35:42", "remaining_time": "4 days, 23:57:58", "throughput": 1632.3, "total_tokens": 62259200} {"current_steps": 7700, "total_steps": 93654, "loss": 1.0614, "learning_rate": 4.9357663737097824e-05, "epoch": 0.24665257223396758, "percentage": 8.22, "elapsed_time": "10:43:34", "remaining_time": "4 days, 23:44:05", "throughput": 1633.55, "total_tokens": 63078400} {"current_steps": 7800, "total_steps": 93654, "loss": 1.0525, "learning_rate": 4.9338432074901276e-05, "epoch": 0.24985585239285027, "percentage": 8.33, "elapsed_time": "10:51:28", "remaining_time": "4 days, 23:30:38", "throughput": 1634.71, "total_tokens": 63897600} {"current_steps": 7900, "total_steps": 93654, "loss": 1.0947, "learning_rate": 4.931892060248032e-05, "epoch": 0.25305913255173296, "percentage": 8.44, "elapsed_time": "10:59:22", "remaining_time": "4 days, 23:17:23", "throughput": 1635.83, "total_tokens": 64716800} {"current_steps": 8000, "total_steps": 93654, "loss": 0.9886, "learning_rate": 4.929912954415135e-05, "epoch": 0.2562624127106157, "percentage": 8.54, "elapsed_time": "11:07:15", "remaining_time": "4 days, 23:04:07", "throughput": 1636.96, "total_tokens": 65536000} {"current_steps": 8100, "total_steps": 93654, "loss": 1.0407, "learning_rate": 4.9279059127445074e-05, "epoch": 0.2594656928694984, "percentage": 8.65, "elapsed_time": "11:15:09", "remaining_time": "4 days, 22:51:05", "throughput": 1638.03, "total_tokens": 66355200} {"current_steps": 8200, "total_steps": 93654, "loss": 1.021, "learning_rate": 4.925870958310388e-05, "epoch": 0.26266897302838105, "percentage": 8.76, "elapsed_time": "11:23:02", "remaining_time": "4 days, 22:38:11", "throughput": 1639.09, "total_tokens": 67174400} {"current_steps": 8300, "total_steps": 93654, "loss": 1.027, "learning_rate": 4.923808114507916e-05, "epoch": 0.26587225318726376, "percentage": 8.86, "elapsed_time": "11:30:56", "remaining_time": "4 days, 22:25:21", "throughput": 1640.12, "total_tokens": 67993600} {"current_steps": 8400, "total_steps": 93654, "loss": 1.0552, "learning_rate": 4.921717405052868e-05, "epoch": 0.2690755333461465, "percentage": 8.97, "elapsed_time": "11:38:49", "remaining_time": "4 days, 22:12:30", "throughput": 1641.17, "total_tokens": 68812800} {"current_steps": 8500, "total_steps": 93654, "loss": 1.0552, "learning_rate": 4.9195988539813814e-05, "epoch": 0.27227881350502914, "percentage": 9.08, "elapsed_time": "11:46:41", "remaining_time": "4 days, 21:59:43", "throughput": 1642.21, "total_tokens": 69632000} {"current_steps": 8600, "total_steps": 93654, "loss": 1.0516, "learning_rate": 4.917452485649677e-05, "epoch": 0.27548209366391185, "percentage": 9.18, "elapsed_time": "11:54:35", "remaining_time": "4 days, 21:47:22", "throughput": 1643.14, "total_tokens": 70451200} {"current_steps": 8700, "total_steps": 93654, "loss": 1.0425, "learning_rate": 4.9152783247337823e-05, "epoch": 0.27868537382279457, "percentage": 9.29, "elapsed_time": "12:02:28", "remaining_time": "4 days, 21:34:47", "throughput": 1644.14, "total_tokens": 71270400} {"current_steps": 8800, "total_steps": 93654, "loss": 1.0633, "learning_rate": 4.9130763962292453e-05, "epoch": 0.28188865398167723, "percentage": 9.4, "elapsed_time": "12:10:20", "remaining_time": "4 days, 21:22:20", "throughput": 1645.11, "total_tokens": 72089600} {"current_steps": 8900, "total_steps": 93654, "loss": 1.0208, "learning_rate": 4.9108467254508487e-05, "epoch": 0.28509193414055994, "percentage": 9.5, "elapsed_time": "12:18:11", "remaining_time": "4 days, 21:09:47", "throughput": 1646.1, "total_tokens": 72908800} {"current_steps": 9000, "total_steps": 93654, "loss": 1.0193, "learning_rate": 4.908589338032316e-05, "epoch": 0.2882952142994426, "percentage": 9.61, "elapsed_time": "12:26:05", "remaining_time": "4 days, 20:57:46", "throughput": 1646.98, "total_tokens": 73728000} {"current_steps": 9100, "total_steps": 93654, "loss": 0.9783, "learning_rate": 4.9063042599260234e-05, "epoch": 0.2914984944583253, "percentage": 9.72, "elapsed_time": "12:33:57", "remaining_time": "4 days, 20:45:31", "throughput": 1647.9, "total_tokens": 74547200} {"current_steps": 9200, "total_steps": 93654, "loss": 1.0251, "learning_rate": 4.9039915174026916e-05, "epoch": 0.29470177461720803, "percentage": 9.82, "elapsed_time": "12:41:52", "remaining_time": "4 days, 20:33:49", "throughput": 1648.71, "total_tokens": 75366400} {"current_steps": 9300, "total_steps": 93654, "loss": 1.009, "learning_rate": 4.9016511370510945e-05, "epoch": 0.2979050547760907, "percentage": 9.93, "elapsed_time": "12:49:43", "remaining_time": "4 days, 20:21:37", "throughput": 1649.64, "total_tokens": 76185600} {"current_steps": 9400, "total_steps": 93654, "loss": 1.0154, "learning_rate": 4.8992831457777446e-05, "epoch": 0.3011083349349734, "percentage": 10.04, "elapsed_time": "12:57:36", "remaining_time": "4 days, 20:09:51", "throughput": 1650.46, "total_tokens": 77004800} {"current_steps": 9500, "total_steps": 93654, "loss": 1.0498, "learning_rate": 4.896887570806588e-05, "epoch": 0.3043116150938561, "percentage": 10.14, "elapsed_time": "13:05:29", "remaining_time": "4 days, 19:58:07", "throughput": 1651.28, "total_tokens": 77824000} {"current_steps": 9600, "total_steps": 93654, "loss": 1.0426, "learning_rate": 4.89446443967869e-05, "epoch": 0.3075148952527388, "percentage": 10.25, "elapsed_time": "13:13:24", "remaining_time": "4 days, 19:46:44", "throughput": 1652.02, "total_tokens": 78643200} {"current_steps": 9700, "total_steps": 93654, "loss": 0.9947, "learning_rate": 4.892013780251922e-05, "epoch": 0.3107181754116215, "percentage": 10.36, "elapsed_time": "13:21:18", "remaining_time": "4 days, 19:35:22", "throughput": 1652.76, "total_tokens": 79462400} {"current_steps": 9800, "total_steps": 93654, "loss": 1.0301, "learning_rate": 4.889535620700635e-05, "epoch": 0.3139214555705042, "percentage": 10.46, "elapsed_time": "13:29:11", "remaining_time": "4 days, 19:23:50", "throughput": 1653.54, "total_tokens": 80281600} {"current_steps": 9900, "total_steps": 93654, "loss": 0.976, "learning_rate": 4.887029989515341e-05, "epoch": 0.3171247357293869, "percentage": 10.57, "elapsed_time": "13:37:03", "remaining_time": "4 days, 19:12:17", "throughput": 1654.33, "total_tokens": 81100800} {"current_steps": 10000, "total_steps": 93654, "loss": 1.0477, "learning_rate": 4.884496915502385e-05, "epoch": 0.3203280158882696, "percentage": 10.68, "elapsed_time": "13:44:56", "remaining_time": "4 days, 19:00:54", "throughput": 1655.08, "total_tokens": 81920000} {"current_steps": 10100, "total_steps": 93654, "loss": 1.0019, "learning_rate": 4.881936427783607e-05, "epoch": 0.3235312960471523, "percentage": 10.78, "elapsed_time": "13:52:49", "remaining_time": "4 days, 18:49:37", "throughput": 1655.81, "total_tokens": 82739200} {"current_steps": 10200, "total_steps": 93654, "loss": 0.997, "learning_rate": 4.879348555796018e-05, "epoch": 0.32673457620603497, "percentage": 10.89, "elapsed_time": "14:00:41", "remaining_time": "4 days, 18:38:16", "throughput": 1656.56, "total_tokens": 83558400} {"current_steps": 10300, "total_steps": 93654, "loss": 0.9891, "learning_rate": 4.8767333292914544e-05, "epoch": 0.3299378563649177, "percentage": 11.0, "elapsed_time": "14:08:34", "remaining_time": "4 days, 18:27:11", "throughput": 1657.24, "total_tokens": 84377600} {"current_steps": 10400, "total_steps": 93654, "loss": 1.0175, "learning_rate": 4.874090778336235e-05, "epoch": 0.3331411365238004, "percentage": 11.1, "elapsed_time": "14:16:26", "remaining_time": "4 days, 18:15:59", "throughput": 1657.96, "total_tokens": 85196800} {"current_steps": 10500, "total_steps": 93654, "loss": 1.0151, "learning_rate": 4.8714209333108236e-05, "epoch": 0.33634441668268306, "percentage": 11.21, "elapsed_time": "14:24:17", "remaining_time": "4 days, 18:04:39", "throughput": 1658.71, "total_tokens": 86016000} {"current_steps": 10600, "total_steps": 93654, "loss": 1.025, "learning_rate": 4.868723824909469e-05, "epoch": 0.33954769684156577, "percentage": 11.32, "elapsed_time": "14:32:10", "remaining_time": "4 days, 17:53:43", "throughput": 1659.36, "total_tokens": 86835200} {"current_steps": 10700, "total_steps": 93654, "loss": 1.0334, "learning_rate": 4.8659994841398594e-05, "epoch": 0.3427509770004485, "percentage": 11.43, "elapsed_time": "14:40:03", "remaining_time": "4 days, 17:42:47", "throughput": 1660.02, "total_tokens": 87654400} {"current_steps": 10800, "total_steps": 93654, "loss": 1.0237, "learning_rate": 4.863247942322764e-05, "epoch": 0.34595425715933115, "percentage": 11.53, "elapsed_time": "14:47:56", "remaining_time": "4 days, 17:32:02", "throughput": 1660.64, "total_tokens": 88473600} {"current_steps": 10900, "total_steps": 93654, "loss": 1.0181, "learning_rate": 4.860469231091671e-05, "epoch": 0.34915753731821386, "percentage": 11.64, "elapsed_time": "14:55:49", "remaining_time": "4 days, 17:21:14", "throughput": 1661.27, "total_tokens": 89292800} {"current_steps": 11000, "total_steps": 93654, "loss": 1.0289, "learning_rate": 4.857663382392428e-05, "epoch": 0.3523608174770965, "percentage": 11.75, "elapsed_time": "15:03:41", "remaining_time": "4 days, 17:10:19", "throughput": 1661.93, "total_tokens": 90112000} {"current_steps": 11100, "total_steps": 93654, "loss": 1.0296, "learning_rate": 4.854830428482871e-05, "epoch": 0.35556409763597924, "percentage": 11.85, "elapsed_time": "15:11:35", "remaining_time": "4 days, 16:59:43", "throughput": 1662.51, "total_tokens": 90931200} {"current_steps": 11200, "total_steps": 93654, "loss": 0.9784, "learning_rate": 4.851970401932454e-05, "epoch": 0.35876737779486195, "percentage": 11.96, "elapsed_time": "15:19:25", "remaining_time": "4 days, 16:48:46", "throughput": 1663.18, "total_tokens": 91750400} {"current_steps": 11300, "total_steps": 93654, "loss": 1.0842, "learning_rate": 4.849083335621878e-05, "epoch": 0.3619706579537446, "percentage": 12.07, "elapsed_time": "15:27:31", "remaining_time": "4 days, 16:39:49", "throughput": 1663.37, "total_tokens": 92569600} {"current_steps": 11400, "total_steps": 93654, "loss": 1.0196, "learning_rate": 4.846169262742709e-05, "epoch": 0.3651739381126273, "percentage": 12.17, "elapsed_time": "15:35:21", "remaining_time": "4 days, 16:28:49", "throughput": 1664.06, "total_tokens": 93388800} {"current_steps": 11500, "total_steps": 93654, "loss": 1.0103, "learning_rate": 4.843228216796996e-05, "epoch": 0.36837721827151004, "percentage": 12.28, "elapsed_time": "15:43:09", "remaining_time": "4 days, 16:17:44", "throughput": 1664.76, "total_tokens": 94208000} {"current_steps": 11600, "total_steps": 93654, "loss": 1.0551, "learning_rate": 4.8402602315968905e-05, "epoch": 0.3715804984303927, "percentage": 12.39, "elapsed_time": "15:50:49", "remaining_time": "4 days, 16:05:49", "throughput": 1665.68, "total_tokens": 95027200} {"current_steps": 11700, "total_steps": 93654, "loss": 1.0221, "learning_rate": 4.837265341264253e-05, "epoch": 0.3747837785892754, "percentage": 12.49, "elapsed_time": "15:58:09", "remaining_time": "4 days, 15:51:34", "throughput": 1667.19, "total_tokens": 95846400} {"current_steps": 11800, "total_steps": 93654, "loss": 0.975, "learning_rate": 4.834243580230266e-05, "epoch": 0.37798705874815813, "percentage": 12.6, "elapsed_time": "16:06:02", "remaining_time": "4 days, 15:41:10", "throughput": 1667.74, "total_tokens": 96665600} {"current_steps": 11900, "total_steps": 93654, "loss": 1.0152, "learning_rate": 4.831194983235029e-05, "epoch": 0.3811903389070408, "percentage": 12.71, "elapsed_time": "16:15:14", "remaining_time": "4 days, 15:40:00", "throughput": 1665.99, "total_tokens": 97484800} {"current_steps": 12000, "total_steps": 93654, "loss": 0.9909, "learning_rate": 4.82811958532717e-05, "epoch": 0.3843936190659235, "percentage": 12.81, "elapsed_time": "16:23:20", "remaining_time": "4 days, 15:31:11", "throughput": 1666.15, "total_tokens": 98304000} {"current_steps": 12100, "total_steps": 93654, "loss": 1.0208, "learning_rate": 4.825017421863436e-05, "epoch": 0.3875968992248062, "percentage": 12.92, "elapsed_time": "16:31:16", "remaining_time": "4 days, 15:21:09", "throughput": 1666.6, "total_tokens": 99123200} {"current_steps": 12200, "total_steps": 93654, "loss": 1.0189, "learning_rate": 4.821888528508287e-05, "epoch": 0.3908001793836889, "percentage": 13.03, "elapsed_time": "16:38:54", "remaining_time": "4 days, 15:09:18", "throughput": 1667.52, "total_tokens": 99942400} {"current_steps": 12300, "total_steps": 93654, "loss": 1.055, "learning_rate": 4.8187329412334884e-05, "epoch": 0.3940034595425716, "percentage": 13.13, "elapsed_time": "16:46:35", "remaining_time": "4 days, 14:57:47", "throughput": 1668.35, "total_tokens": 100761600} {"current_steps": 12400, "total_steps": 93654, "loss": 1.0586, "learning_rate": 4.815550696317695e-05, "epoch": 0.3972067397014543, "percentage": 13.24, "elapsed_time": "16:54:15", "remaining_time": "4 days, 14:46:10", "throughput": 1669.21, "total_tokens": 101580800} {"current_steps": 12500, "total_steps": 93654, "loss": 1.0073, "learning_rate": 4.812341830346035e-05, "epoch": 0.400410019860337, "percentage": 13.35, "elapsed_time": "17:01:55", "remaining_time": "4 days, 14:34:42", "throughput": 1670.04, "total_tokens": 102400000} {"current_steps": 12600, "total_steps": 93654, "loss": 1.0012, "learning_rate": 4.80910638020969e-05, "epoch": 0.4036133000192197, "percentage": 13.45, "elapsed_time": "17:09:40", "remaining_time": "4 days, 14:23:42", "throughput": 1670.75, "total_tokens": 103219200} {"current_steps": 12700, "total_steps": 93654, "loss": 0.9919, "learning_rate": 4.805844383105469e-05, "epoch": 0.40681658017810235, "percentage": 13.56, "elapsed_time": "17:17:24", "remaining_time": "4 days, 14:12:48", "throughput": 1671.44, "total_tokens": 104038400} {"current_steps": 12800, "total_steps": 93654, "loss": 1.0369, "learning_rate": 4.802555876535383e-05, "epoch": 0.41001986033698506, "percentage": 13.67, "elapsed_time": "17:25:33", "remaining_time": "4 days, 14:04:27", "throughput": 1671.49, "total_tokens": 104857600} {"current_steps": 12900, "total_steps": 93654, "loss": 1.0105, "learning_rate": 4.799240898306214e-05, "epoch": 0.4132231404958678, "percentage": 13.77, "elapsed_time": "17:33:16", "remaining_time": "4 days, 13:53:29", "throughput": 1672.2, "total_tokens": 105676800} {"current_steps": 13000, "total_steps": 93654, "loss": 0.9861, "learning_rate": 4.7958994865290766e-05, "epoch": 0.41642642065475044, "percentage": 13.88, "elapsed_time": "17:40:57", "remaining_time": "4 days, 13:42:21", "throughput": 1672.95, "total_tokens": 106496000} {"current_steps": 13100, "total_steps": 93654, "loss": 0.9772, "learning_rate": 4.7925316796189826e-05, "epoch": 0.41962970081363316, "percentage": 13.99, "elapsed_time": "17:50:29", "remaining_time": "4 days, 13:42:39", "throughput": 1670.8, "total_tokens": 107315200} {"current_steps": 13200, "total_steps": 93654, "loss": 1.0186, "learning_rate": 4.789137516294402e-05, "epoch": 0.42283298097251587, "percentage": 14.09, "elapsed_time": "18:00:15", "remaining_time": "4 days, 13:44:10", "throughput": 1668.34, "total_tokens": 108134400} {"current_steps": 13300, "total_steps": 93654, "loss": 1.036, "learning_rate": 4.785717035576812e-05, "epoch": 0.42603626113139853, "percentage": 14.2, "elapsed_time": "18:08:53", "remaining_time": "4 days, 13:38:40", "throughput": 1667.66, "total_tokens": 108953600} {"current_steps": 13400, "total_steps": 93654, "loss": 1.0709, "learning_rate": 4.782270276790254e-05, "epoch": 0.42923954129028125, "percentage": 14.31, "elapsed_time": "18:17:06", "remaining_time": "4 days, 13:30:43", "throughput": 1667.6, "total_tokens": 109772800} {"current_steps": 13500, "total_steps": 93654, "loss": 0.9704, "learning_rate": 4.778797279560876e-05, "epoch": 0.43244282144916396, "percentage": 14.41, "elapsed_time": "18:25:22", "remaining_time": "4 days, 13:22:58", "throughput": 1667.49, "total_tokens": 110592000} {"current_steps": 13600, "total_steps": 93654, "loss": 0.9966, "learning_rate": 4.775298083816482e-05, "epoch": 0.4356461016080466, "percentage": 14.52, "elapsed_time": "18:33:37", "remaining_time": "4 days, 13:15:10", "throughput": 1667.39, "total_tokens": 111411200} {"current_steps": 13100, "total_steps": 93654, "loss": 0.9771, "learning_rate": 4.7925316796189826e-05, "epoch": 0.41962970081363316, "percentage": 13.99, "elapsed_time": "0:09:02", "remaining_time": "0:55:38", "throughput": 197637.13, "total_tokens": 107315200} {"current_steps": 13200, "total_steps": 93654, "loss": 1.0188, "learning_rate": 4.789137516294402e-05, "epoch": 0.42283298097251587, "percentage": 14.09, "elapsed_time": "0:17:18", "remaining_time": "1:45:29", "throughput": 104132.7, "total_tokens": 108134400} {"current_steps": 13300, "total_steps": 93654, "loss": 1.0355, "learning_rate": 4.785717035576812e-05, "epoch": 0.42603626113139853, "percentage": 14.2, "elapsed_time": "0:25:31", "remaining_time": "2:34:15", "throughput": 71119.82, "total_tokens": 108953600} {"current_steps": 13400, "total_steps": 93654, "loss": 1.0711, "learning_rate": 4.782270276790254e-05, "epoch": 0.42923954129028125, "percentage": 14.31, "elapsed_time": "0:33:48", "remaining_time": "3:22:29", "throughput": 54111.89, "total_tokens": 109772800} {"current_steps": 13100, "total_steps": 93654, "loss": 0.9772, "learning_rate": 4.7925316796189826e-05, "epoch": 0.41962970081363316, "percentage": 13.99, "elapsed_time": "0:08:16", "remaining_time": "0:50:55", "throughput": 216003.42, "total_tokens": 107315200} {"current_steps": 13200, "total_steps": 93654, "loss": 1.0187, "learning_rate": 4.789137516294402e-05, "epoch": 0.42283298097251587, "percentage": 14.09, "elapsed_time": "0:16:24", "remaining_time": "1:40:03", "throughput": 109787.53, "total_tokens": 108134400} {"current_steps": 13300, "total_steps": 93654, "loss": 1.036, "learning_rate": 4.785717035576812e-05, "epoch": 0.42603626113139853, "percentage": 14.2, "elapsed_time": "0:24:30", "remaining_time": "2:28:05", "throughput": 74085.03, "total_tokens": 108953600} {"current_steps": 13400, "total_steps": 93654, "loss": 1.0706, "learning_rate": 4.782270276790254e-05, "epoch": 0.42923954129028125, "percentage": 14.31, "elapsed_time": "0:32:38", "remaining_time": "3:15:31", "throughput": 56038.85, "total_tokens": 109772800} {"current_steps": 13500, "total_steps": 93654, "loss": 0.9705, "learning_rate": 4.778797279560876e-05, "epoch": 0.43244282144916396, "percentage": 14.41, "elapsed_time": "0:40:45", "remaining_time": "4:01:57", "throughput": 45230.93, "total_tokens": 110592000} {"current_steps": 13600, "total_steps": 93654, "loss": 0.9968, "learning_rate": 4.775298083816482e-05, "epoch": 0.4356461016080466, "percentage": 14.52, "elapsed_time": "0:48:52", "remaining_time": "4:47:43", "throughput": 37988.84, "total_tokens": 111411200} {"current_steps": 13700, "total_steps": 93654, "loss": 1.033, "learning_rate": 4.77177272978607e-05, "epoch": 0.43884938176692934, "percentage": 14.63, "elapsed_time": "0:56:59", "remaining_time": "5:32:35", "throughput": 32821.92, "total_tokens": 112230400} {"current_steps": 13100, "total_steps": 93654, "loss": 0.9771, "learning_rate": 4.7925316796189826e-05, "epoch": 0.41962970081363316, "percentage": 13.99, "elapsed_time": "0:08:21", "remaining_time": "0:51:25", "throughput": 213864.45, "total_tokens": 107315200} {"current_steps": 13200, "total_steps": 93654, "loss": 1.0182, "learning_rate": 4.789137516294402e-05, "epoch": 0.42283298097251587, "percentage": 14.09, "elapsed_time": "0:16:22", "remaining_time": "1:39:47", "throughput": 110071.05, "total_tokens": 108134400} {"current_steps": 13300, "total_steps": 93654, "loss": 1.036, "learning_rate": 4.785717035576812e-05, "epoch": 0.42603626113139853, "percentage": 14.2, "elapsed_time": "0:24:21", "remaining_time": "2:27:12", "throughput": 74526.95, "total_tokens": 108953600} {"current_steps": 13400, "total_steps": 93654, "loss": 1.0713, "learning_rate": 4.782270276790254e-05, "epoch": 0.42923954129028125, "percentage": 14.31, "elapsed_time": "0:32:24", "remaining_time": "3:14:05", "throughput": 56455.61, "total_tokens": 109772800} {"current_steps": 13500, "total_steps": 93654, "loss": 0.9708, "learning_rate": 4.778797279560876e-05, "epoch": 0.43244282144916396, "percentage": 14.41, "elapsed_time": "0:40:24", "remaining_time": "3:59:54", "throughput": 45615.59, "total_tokens": 110592000} {"current_steps": 13600, "total_steps": 93654, "loss": 0.9967, "learning_rate": 4.775298083816482e-05, "epoch": 0.4356461016080466, "percentage": 14.52, "elapsed_time": "0:48:25", "remaining_time": "4:45:04", "throughput": 38340.63, "total_tokens": 111411200} {"current_steps": 13700, "total_steps": 93654, "loss": 1.0333, "learning_rate": 4.77177272978607e-05, "epoch": 0.43884938176692934, "percentage": 14.63, "elapsed_time": "0:56:26", "remaining_time": "5:29:23", "throughput": 33140.43, "total_tokens": 112230400} {"current_steps": 13800, "total_steps": 93654, "loss": 1.0308, "learning_rate": 4.768221257999373e-05, "epoch": 0.44205266192581205, "percentage": 14.74, "elapsed_time": "1:04:26", "remaining_time": "6:12:55", "throughput": 29235.53, "total_tokens": 113049600} {"current_steps": 13900, "total_steps": 93654, "loss": 1.057, "learning_rate": 4.764643709286386e-05, "epoch": 0.4452559420846947, "percentage": 14.84, "elapsed_time": "1:12:27", "remaining_time": "6:55:47", "throughput": 26189.01, "total_tokens": 113868800} {"current_steps": 14000, "total_steps": 93654, "loss": 1.0059, "learning_rate": 4.761040124776904e-05, "epoch": 0.4484592222435774, "percentage": 14.95, "elapsed_time": "1:20:27", "remaining_time": "7:37:45", "throughput": 23758.01, "total_tokens": 114688000} {"current_steps": 14100, "total_steps": 93654, "loss": 1.0717, "learning_rate": 4.757410545900047e-05, "epoch": 0.45166250240246014, "percentage": 15.06, "elapsed_time": "1:28:57", "remaining_time": "8:21:55", "throughput": 21640.53, "total_tokens": 115507200} {"current_steps": 14200, "total_steps": 93654, "loss": 1.0313, "learning_rate": 4.7537550143837796e-05, "epoch": 0.4548657825613428, "percentage": 15.16, "elapsed_time": "1:36:58", "remaining_time": "9:02:35", "throughput": 19993.1, "total_tokens": 116326400} {"current_steps": 14300, "total_steps": 93654, "loss": 1.0296, "learning_rate": 4.750073572254438e-05, "epoch": 0.4580690627202255, "percentage": 15.27, "elapsed_time": "1:44:57", "remaining_time": "9:42:25", "throughput": 18602.26, "total_tokens": 117145600} {"current_steps": 14400, "total_steps": 93654, "loss": 0.9977, "learning_rate": 4.746366261836242e-05, "epoch": 0.46127234287910823, "percentage": 15.38, "elapsed_time": "1:52:57", "remaining_time": "10:21:42", "throughput": 17405.07, "total_tokens": 117964800} {"current_steps": 14500, "total_steps": 93654, "loss": 0.9753, "learning_rate": 4.742633125750808e-05, "epoch": 0.4644756230379909, "percentage": 15.48, "elapsed_time": "2:00:57", "remaining_time": "11:00:17", "throughput": 16367.32, "total_tokens": 118784000} {"current_steps": 14600, "total_steps": 93654, "loss": 0.9722, "learning_rate": 4.738874206916665e-05, "epoch": 0.4676789031968736, "percentage": 15.59, "elapsed_time": "2:08:57", "remaining_time": "11:38:18", "throughput": 15456.81, "total_tokens": 119603200} {"current_steps": 14700, "total_steps": 93654, "loss": 1.066, "learning_rate": 4.7350895485487526e-05, "epoch": 0.47088218335575627, "percentage": 15.7, "elapsed_time": "2:16:57", "remaining_time": "12:15:36", "throughput": 14654.25, "total_tokens": 120422400} {"current_steps": 14800, "total_steps": 93654, "loss": 0.973, "learning_rate": 4.731279194157933e-05, "epoch": 0.474085463514639, "percentage": 15.8, "elapsed_time": "2:24:55", "remaining_time": "12:52:10", "throughput": 13942.79, "total_tokens": 121241600} {"current_steps": 14900, "total_steps": 93654, "loss": 0.9922, "learning_rate": 4.727443187550481e-05, "epoch": 0.4772887436735217, "percentage": 15.91, "elapsed_time": "2:32:59", "remaining_time": "13:28:39", "throughput": 13296.84, "total_tokens": 122060800} {"current_steps": 15000, "total_steps": 93654, "loss": 0.9851, "learning_rate": 4.723581572827592e-05, "epoch": 0.48049202383240436, "percentage": 16.02, "elapsed_time": "2:41:54", "remaining_time": "14:08:58", "throughput": 12649.29, "total_tokens": 122880000} {"current_steps": 15100, "total_steps": 93654, "loss": 1.0284, "learning_rate": 4.719694394384863e-05, "epoch": 0.4836953039912871, "percentage": 16.12, "elapsed_time": "2:52:06", "remaining_time": "14:55:20", "throughput": 11978.88, "total_tokens": 123699200} {"current_steps": 15200, "total_steps": 93654, "loss": 0.9828, "learning_rate": 4.715781696911792e-05, "epoch": 0.4868985841501698, "percentage": 16.23, "elapsed_time": "3:02:25", "remaining_time": "15:41:34", "throughput": 11376.31, "total_tokens": 124518400} {"current_steps": 15300, "total_steps": 93654, "loss": 0.9621, "learning_rate": 4.7118435253912575e-05, "epoch": 0.49010186430905245, "percentage": 16.34, "elapsed_time": "3:13:14", "remaining_time": "16:29:36", "throughput": 10810.32, "total_tokens": 125337600} {"current_steps": 15400, "total_steps": 93654, "loss": 1.013, "learning_rate": 4.7078799250990056e-05, "epoch": 0.49330514446793516, "percentage": 16.44, "elapsed_time": "3:23:25", "remaining_time": "17:13:40", "throughput": 10336.19, "total_tokens": 126156800} {"current_steps": 15500, "total_steps": 93654, "loss": 1.0564, "learning_rate": 4.7038909416031276e-05, "epoch": 0.4965084246268179, "percentage": 16.55, "elapsed_time": "3:33:32", "remaining_time": "17:56:43", "throughput": 9910.26, "total_tokens": 126976000} {"current_steps": 15600, "total_steps": 93654, "loss": 0.9828, "learning_rate": 4.699876620763535e-05, "epoch": 0.49971170478570054, "percentage": 16.66, "elapsed_time": "3:43:52", "remaining_time": "18:40:11", "throughput": 9513.6, "total_tokens": 127795200} {"current_steps": 15700, "total_steps": 93654, "loss": 1.0435, "learning_rate": 4.6958370087314344e-05, "epoch": 0.5029149849445832, "percentage": 16.76, "elapsed_time": "3:53:30", "remaining_time": "19:19:24", "throughput": 9179.94, "total_tokens": 128614400} {"current_steps": 15800, "total_steps": 93654, "loss": 0.9438, "learning_rate": 4.691772151948799e-05, "epoch": 0.5061182651034659, "percentage": 16.87, "elapsed_time": "4:02:45", "remaining_time": "19:56:11", "throughput": 8886.31, "total_tokens": 129433600} {"current_steps": 15900, "total_steps": 93654, "loss": 0.947, "learning_rate": 4.687682097147826e-05, "epoch": 0.5093215452623486, "percentage": 16.98, "elapsed_time": "4:11:57", "remaining_time": "20:32:06", "throughput": 8616.15, "total_tokens": 130252800} {"current_steps": 16000, "total_steps": 93654, "loss": 0.9461, "learning_rate": 4.683566891350412e-05, "epoch": 0.5125248254212313, "percentage": 17.08, "elapsed_time": "4:20:18", "remaining_time": "21:03:23", "throughput": 8391.93, "total_tokens": 131072000} {"current_steps": 16100, "total_steps": 93654, "loss": 0.9964, "learning_rate": 4.679426581867599e-05, "epoch": 0.5157281055801141, "percentage": 17.19, "elapsed_time": "4:28:53", "remaining_time": "21:35:13", "throughput": 8175.23, "total_tokens": 131891200} {"current_steps": 16200, "total_steps": 93654, "loss": 0.9499, "learning_rate": 4.675261216299042e-05, "epoch": 0.5189313857389968, "percentage": 17.3, "elapsed_time": "4:37:10", "remaining_time": "22:05:11", "throughput": 7980.05, "total_tokens": 132710400} {"current_steps": 16300, "total_steps": 93654, "loss": 1.0205, "learning_rate": 4.6710708425324545e-05, "epoch": 0.5221346658978794, "percentage": 17.4, "elapsed_time": "4:45:21", "remaining_time": "22:34:14", "throughput": 7798.76, "total_tokens": 133529600} {"current_steps": 16400, "total_steps": 93654, "loss": 0.9996, "learning_rate": 4.6668555087430605e-05, "epoch": 0.5253379460567621, "percentage": 17.51, "elapsed_time": "4:53:33", "remaining_time": "23:02:51", "throughput": 7627.46, "total_tokens": 134348800} {"current_steps": 16500, "total_steps": 93654, "loss": 1.0013, "learning_rate": 4.662615263393041e-05, "epoch": 0.5285412262156448, "percentage": 17.62, "elapsed_time": "5:01:43", "remaining_time": "23:30:52", "throughput": 7466.37, "total_tokens": 135168000} {"current_steps": 16600, "total_steps": 93654, "loss": 1.0437, "learning_rate": 4.658350155230976e-05, "epoch": 0.5317445063745275, "percentage": 17.72, "elapsed_time": "5:09:55", "remaining_time": "23:58:37", "throughput": 7312.82, "total_tokens": 135987200} {"current_steps": 16700, "total_steps": 93654, "loss": 1.0094, "learning_rate": 4.6540602332912854e-05, "epoch": 0.5349477865334102, "percentage": 17.83, "elapsed_time": "5:18:08", "remaining_time": "1 day, 0:25:59", "throughput": 7167.01, "total_tokens": 136806400} {"current_steps": 16800, "total_steps": 93654, "loss": 1.0141, "learning_rate": 4.6497455468936606e-05, "epoch": 0.538151066692293, "percentage": 17.94, "elapsed_time": "5:26:18", "remaining_time": "1 day, 0:52:45", "throughput": 7029.35, "total_tokens": 137625600} {"current_steps": 16900, "total_steps": 93654, "loss": 1.0359, "learning_rate": 4.645406145642506e-05, "epoch": 0.5413543468511756, "percentage": 18.05, "elapsed_time": "5:34:29", "remaining_time": "1 day, 1:19:08", "throughput": 6898.3, "total_tokens": 138444800} {"current_steps": 17000, "total_steps": 93654, "loss": 0.9605, "learning_rate": 4.64104207942636e-05, "epoch": 0.5445576270100583, "percentage": 18.15, "elapsed_time": "5:44:54", "remaining_time": "1 day, 1:55:11", "throughput": 6729.6, "total_tokens": 139264000} {"current_steps": 17100, "total_steps": 93654, "loss": 0.9502, "learning_rate": 4.6366533984173274e-05, "epoch": 0.547760907168941, "percentage": 18.26, "elapsed_time": "5:56:22", "remaining_time": "1 day, 2:35:27", "throughput": 6551.21, "total_tokens": 140083200} {"current_steps": 17200, "total_steps": 93654, "loss": 1.016, "learning_rate": 4.6322401530704995e-05, "epoch": 0.5509641873278237, "percentage": 18.37, "elapsed_time": "6:07:36", "remaining_time": "1 day, 3:14:01", "throughput": 6388.21, "total_tokens": 140902400} {"current_steps": 17300, "total_steps": 93654, "loss": 1.0039, "learning_rate": 4.627802394123375e-05, "epoch": 0.5541674674867064, "percentage": 18.47, "elapsed_time": "6:18:47", "remaining_time": "1 day, 3:51:47", "throughput": 6235.76, "total_tokens": 141721600} {"current_steps": 17400, "total_steps": 93654, "loss": 0.9972, "learning_rate": 4.623340172595277e-05, "epoch": 0.5573707476455891, "percentage": 18.58, "elapsed_time": "6:29:58", "remaining_time": "1 day, 4:28:59", "throughput": 6092.01, "total_tokens": 142540800} {"current_steps": 17500, "total_steps": 93654, "loss": 0.9894, "learning_rate": 4.6188535397867675e-05, "epoch": 0.5605740278044717, "percentage": 18.69, "elapsed_time": "6:41:12", "remaining_time": "1 day, 5:05:55", "throughput": 5955.33, "total_tokens": 143360000} {"current_steps": 17600, "total_steps": 93654, "loss": 1.0721, "learning_rate": 4.614342547279052e-05, "epoch": 0.5637773079633545, "percentage": 18.79, "elapsed_time": "6:52:27", "remaining_time": "1 day, 5:42:19", "throughput": 5826.02, "total_tokens": 144179200} {"current_steps": 17700, "total_steps": 93654, "loss": 1.0183, "learning_rate": 4.609807246933395e-05, "epoch": 0.5669805881222372, "percentage": 18.9, "elapsed_time": "7:03:40", "remaining_time": "1 day, 6:18:05", "throughput": 5703.91, "total_tokens": 144998400} {"current_steps": 17800, "total_steps": 93654, "loss": 1.0083, "learning_rate": 4.605247690890518e-05, "epoch": 0.5701838682811199, "percentage": 19.01, "elapsed_time": "7:14:52", "remaining_time": "1 day, 6:53:11", "throughput": 5588.53, "total_tokens": 145817600} {"current_steps": 17900, "total_steps": 93654, "loss": 0.9927, "learning_rate": 4.600663931570001e-05, "epoch": 0.5733871484400026, "percentage": 19.11, "elapsed_time": "7:26:01", "remaining_time": "1 day, 7:27:35", "throughput": 5479.45, "total_tokens": 146636800} {"current_steps": 18000, "total_steps": 93654, "loss": 1.0144, "learning_rate": 4.596056021669681e-05, "epoch": 0.5765904285988852, "percentage": 19.22, "elapsed_time": "7:37:13", "remaining_time": "1 day, 8:01:44", "throughput": 5374.97, "total_tokens": 147456000} {"current_steps": 18100, "total_steps": 93654, "loss": 1.0417, "learning_rate": 4.591424014165047e-05, "epoch": 0.5797937087577679, "percentage": 19.33, "elapsed_time": "7:48:39", "remaining_time": "1 day, 8:36:19", "throughput": 5272.96, "total_tokens": 148275200} {"current_steps": 18200, "total_steps": 93654, "loss": 1.0124, "learning_rate": 4.586767962308625e-05, "epoch": 0.5829969889166506, "percentage": 19.43, "elapsed_time": "7:59:52", "remaining_time": "1 day, 9:09:29", "throughput": 5178.19, "total_tokens": 149094400} {"current_steps": 18300, "total_steps": 93654, "loss": 0.9961, "learning_rate": 4.5820879196293756e-05, "epoch": 0.5862002690755334, "percentage": 19.54, "elapsed_time": "8:11:04", "remaining_time": "1 day, 9:42:05", "throughput": 5087.96, "total_tokens": 149913600} {"current_steps": 18400, "total_steps": 93654, "loss": 1.0066, "learning_rate": 4.577383939932069e-05, "epoch": 0.5894035492344161, "percentage": 19.65, "elapsed_time": "8:22:16", "remaining_time": "1 day, 10:14:16", "throughput": 5001.6, "total_tokens": 150732800} {"current_steps": 18500, "total_steps": 93654, "loss": 1.0422, "learning_rate": 4.572656077296676e-05, "epoch": 0.5926068293932988, "percentage": 19.75, "elapsed_time": "8:32:32", "remaining_time": "1 day, 10:42:08", "throughput": 4928.1, "total_tokens": 151552000} {"current_steps": 18600, "total_steps": 93654, "loss": 1.0647, "learning_rate": 4.567904386077734e-05, "epoch": 0.5958101095521814, "percentage": 19.86, "elapsed_time": "8:45:06", "remaining_time": "1 day, 11:18:53", "throughput": 4836.2, "total_tokens": 152371200} {"current_steps": 18700, "total_steps": 93654, "loss": 1.0465, "learning_rate": 4.563128920903735e-05, "epoch": 0.5990133897110641, "percentage": 19.97, "elapsed_time": "8:56:24", "remaining_time": "1 day, 11:50:04", "throughput": 4759.72, "total_tokens": 153190400} {"current_steps": 18800, "total_steps": 93654, "loss": 1.0505, "learning_rate": 4.558329736676488e-05, "epoch": 0.6022166698699468, "percentage": 20.07, "elapsed_time": "9:07:52", "remaining_time": "1 day, 12:21:26", "throughput": 4685.0, "total_tokens": 154009600} {"current_steps": 18900, "total_steps": 93654, "loss": 1.0287, "learning_rate": 4.553506888570494e-05, "epoch": 0.6054199500288295, "percentage": 20.18, "elapsed_time": "9:18:48", "remaining_time": "1 day, 12:50:12", "throughput": 4617.84, "total_tokens": 154828800} {"current_steps": 19000, "total_steps": 93654, "loss": 0.9675, "learning_rate": 4.548660432032307e-05, "epoch": 0.6086232301877122, "percentage": 20.29, "elapsed_time": "9:27:46", "remaining_time": "1 day, 13:10:53", "throughput": 4568.91, "total_tokens": 155648000} {"current_steps": 19100, "total_steps": 93654, "loss": 1.0027, "learning_rate": 4.5437904227799e-05, "epoch": 0.611826510346595, "percentage": 20.39, "elapsed_time": "9:36:20", "remaining_time": "1 day, 13:29:40", "throughput": 4524.71, "total_tokens": 156467200} {"current_steps": 19200, "total_steps": 93654, "loss": 1.0002, "learning_rate": 4.538896916802023e-05, "epoch": 0.6150297905054776, "percentage": 20.5, "elapsed_time": "9:45:17", "remaining_time": "1 day, 13:49:38", "throughput": 4478.9, "total_tokens": 157286400} {"current_steps": 19300, "total_steps": 93654, "loss": 1.0698, "learning_rate": 4.533979970357558e-05, "epoch": 0.6182330706643603, "percentage": 20.61, "elapsed_time": "9:54:14", "remaining_time": "1 day, 14:09:18", "throughput": 4434.43, "total_tokens": 158105600} {"current_steps": 19400, "total_steps": 93654, "loss": 0.9834, "learning_rate": 4.529039639974876e-05, "epoch": 0.621436350823243, "percentage": 20.71, "elapsed_time": "10:03:21", "remaining_time": "1 day, 14:29:23", "throughput": 4389.97, "total_tokens": 158924800} {"current_steps": 19500, "total_steps": 93654, "loss": 0.9634, "learning_rate": 4.524075982451183e-05, "epoch": 0.6246396309821257, "percentage": 20.82, "elapsed_time": "10:12:24", "remaining_time": "1 day, 14:48:50", "throughput": 4347.45, "total_tokens": 159744000} {"current_steps": 19600, "total_steps": 93654, "loss": 1.0221, "learning_rate": 4.5190890548518696e-05, "epoch": 0.6278429111410084, "percentage": 20.93, "elapsed_time": "10:21:47", "remaining_time": "1 day, 15:09:16", "throughput": 4303.81, "total_tokens": 160563200} {"current_steps": 19700, "total_steps": 93654, "loss": 1.0582, "learning_rate": 4.5140789145098536e-05, "epoch": 0.631046191299891, "percentage": 21.03, "elapsed_time": "10:31:16", "remaining_time": "1 day, 15:29:48", "throughput": 4260.75, "total_tokens": 161382400} {"current_steps": 19800, "total_steps": 93654, "loss": 1.0112, "learning_rate": 4.509045619024921e-05, "epoch": 0.6342494714587738, "percentage": 21.14, "elapsed_time": "10:40:08", "remaining_time": "1 day, 15:47:44", "throughput": 4223.04, "total_tokens": 162201600} {"current_steps": 19900, "total_steps": 93654, "loss": 1.0078, "learning_rate": 4.5039892262630656e-05, "epoch": 0.6374527516176565, "percentage": 21.25, "elapsed_time": "10:49:05", "remaining_time": "1 day, 16:05:40", "throughput": 4185.88, "total_tokens": 163020800} {"current_steps": 20000, "total_steps": 93654, "loss": 1.0239, "learning_rate": 4.498909794355821e-05, "epoch": 0.6406560317765392, "percentage": 21.36, "elapsed_time": "10:57:46", "remaining_time": "1 day, 16:22:24", "throughput": 4151.34, "total_tokens": 163840000} {"current_steps": 20100, "total_steps": 93654, "loss": 1.0088, "learning_rate": 4.493807381699595e-05, "epoch": 0.6438593119354219, "percentage": 21.46, "elapsed_time": "11:06:45", "remaining_time": "1 day, 16:39:56", "throughput": 4115.92, "total_tokens": 164659200} {"current_steps": 20200, "total_steps": 93654, "loss": 0.9566, "learning_rate": 4.488682046954994e-05, "epoch": 0.6470625920943046, "percentage": 21.57, "elapsed_time": "11:15:26", "remaining_time": "1 day, 16:56:08", "throughput": 4083.19, "total_tokens": 165478400} {"current_steps": 20300, "total_steps": 93654, "loss": 1.0226, "learning_rate": 4.483533849046155e-05, "epoch": 0.6502658722531872, "percentage": 21.68, "elapsed_time": "11:24:11", "remaining_time": "1 day, 17:12:20", "throughput": 4050.91, "total_tokens": 166297600} {"current_steps": 20400, "total_steps": 93654, "loss": 1.0637, "learning_rate": 4.4783628471600636e-05, "epoch": 0.6534691524120699, "percentage": 21.78, "elapsed_time": "11:33:32", "remaining_time": "1 day, 17:30:26", "throughput": 4015.99, "total_tokens": 167116800} {"current_steps": 20500, "total_steps": 93654, "loss": 0.9601, "learning_rate": 4.473169100745871e-05, "epoch": 0.6566724325709526, "percentage": 21.89, "elapsed_time": "11:43:45", "remaining_time": "1 day, 17:51:22", "throughput": 3977.1, "total_tokens": 167936000} {"current_steps": 20600, "total_steps": 93654, "loss": 1.0388, "learning_rate": 4.4679526695142195e-05, "epoch": 0.6598757127298354, "percentage": 22.0, "elapsed_time": "11:54:59", "remaining_time": "1 day, 18:15:33", "throughput": 3933.76, "total_tokens": 168755200} {"current_steps": 20700, "total_steps": 93654, "loss": 0.998, "learning_rate": 4.4627136134365463e-05, "epoch": 0.6630789928887181, "percentage": 22.1, "elapsed_time": "12:06:28", "remaining_time": "1 day, 18:40:22", "throughput": 3890.31, "total_tokens": 169574400} {"current_steps": 20100, "total_steps": 93654, "loss": 1.009, "learning_rate": 4.493807381699595e-05, "epoch": 0.6438593119354219, "percentage": 21.46, "elapsed_time": "0:08:10", "remaining_time": "0:29:54", "throughput": 335754.59, "total_tokens": 164659200} {"current_steps": 20200, "total_steps": 93654, "loss": 0.9565, "learning_rate": 4.488682046954994e-05, "epoch": 0.6470625920943046, "percentage": 21.57, "elapsed_time": "0:16:10", "remaining_time": "0:58:50", "throughput": 170436.88, "total_tokens": 165478400} {"current_steps": 20300, "total_steps": 93654, "loss": 1.0225, "learning_rate": 4.483533849046155e-05, "epoch": 0.6502658722531872, "percentage": 21.68, "elapsed_time": "0:24:13", "remaining_time": "1:27:30", "throughput": 114441.94, "total_tokens": 166297600} {"current_steps": 20400, "total_steps": 93654, "loss": 1.0642, "learning_rate": 4.4783628471600636e-05, "epoch": 0.6534691524120699, "percentage": 21.78, "elapsed_time": "0:32:29", "remaining_time": "1:56:39", "throughput": 85729.51, "total_tokens": 167116800} {"current_steps": 20500, "total_steps": 93654, "loss": 0.9598, "learning_rate": 4.473169100745871e-05, "epoch": 0.6566724325709526, "percentage": 21.89, "elapsed_time": "0:40:04", "remaining_time": "2:23:01", "throughput": 69831.43, "total_tokens": 167936000} {"current_steps": 20600, "total_steps": 93654, "loss": 1.0391, "learning_rate": 4.4679526695142195e-05, "epoch": 0.6598757127298354, "percentage": 22.0, "elapsed_time": "0:47:45", "remaining_time": "2:49:21", "throughput": 58893.55, "total_tokens": 168755200} {"current_steps": 20700, "total_steps": 93654, "loss": 0.998, "learning_rate": 4.4627136134365463e-05, "epoch": 0.6630789928887181, "percentage": 22.1, "elapsed_time": "0:55:23", "remaining_time": "3:15:13", "throughput": 51023.28, "total_tokens": 169574400} {"current_steps": 20800, "total_steps": 93654, "loss": 1.0335, "learning_rate": 4.457451992744402e-05, "epoch": 0.6662822730476008, "percentage": 22.21, "elapsed_time": "1:03:02", "remaining_time": "3:40:47", "throughput": 45051.09, "total_tokens": 170393600} {"current_steps": 20900, "total_steps": 93654, "loss": 1.0459, "learning_rate": 4.452167867928751e-05, "epoch": 0.6694855532064834, "percentage": 22.32, "elapsed_time": "1:10:42", "remaining_time": "4:06:06", "throughput": 40360.57, "total_tokens": 171212800} {"current_steps": 21000, "total_steps": 93654, "loss": 0.9922, "learning_rate": 4.4468612997392824e-05, "epoch": 0.6726888333653661, "percentage": 22.42, "elapsed_time": "1:18:19", "remaining_time": "4:30:59", "throughput": 36604.36, "total_tokens": 172032000} {"current_steps": 21100, "total_steps": 93654, "loss": 1.0024, "learning_rate": 4.441532349183706e-05, "epoch": 0.6758921135242488, "percentage": 22.53, "elapsed_time": "1:26:11", "remaining_time": "4:56:20", "throughput": 33427.03, "total_tokens": 172851200} {"current_steps": 21200, "total_steps": 93654, "loss": 0.994, "learning_rate": 4.4361810775270554e-05, "epoch": 0.6790953936831315, "percentage": 22.64, "elapsed_time": "1:33:50", "remaining_time": "5:20:44", "throughput": 30842.2, "total_tokens": 173670400} {"current_steps": 21300, "total_steps": 93654, "loss": 0.9669, "learning_rate": 4.430807546290982e-05, "epoch": 0.6822986738420143, "percentage": 22.74, "elapsed_time": "1:41:28", "remaining_time": "5:44:42", "throughput": 28658.46, "total_tokens": 174489600} {"current_steps": 21400, "total_steps": 93654, "loss": 1.0029, "learning_rate": 4.425411817253048e-05, "epoch": 0.685501954000897, "percentage": 22.85, "elapsed_time": "1:49:07", "remaining_time": "6:08:26", "throughput": 26775.7, "total_tokens": 175308800} {"current_steps": 21500, "total_steps": 93654, "loss": 1.0158, "learning_rate": 4.419993952446013e-05, "epoch": 0.6887052341597796, "percentage": 22.96, "elapsed_time": "1:56:46", "remaining_time": "6:31:52", "throughput": 25139.0, "total_tokens": 176128000} {"current_steps": 21600, "total_steps": 93654, "loss": 1.0571, "learning_rate": 4.414554014157127e-05, "epoch": 0.6919085143186623, "percentage": 23.06, "elapsed_time": "2:04:26", "remaining_time": "6:55:05", "throughput": 23700.07, "total_tokens": 176947200} {"current_steps": 21700, "total_steps": 93654, "loss": 0.9647, "learning_rate": 4.4090920649274095e-05, "epoch": 0.695111794477545, "percentage": 23.17, "elapsed_time": "2:12:03", "remaining_time": "7:17:54", "throughput": 22434.06, "total_tokens": 177766400} {"current_steps": 21800, "total_steps": 93654, "loss": 0.9609, "learning_rate": 4.40360816755093e-05, "epoch": 0.6983150746364277, "percentage": 23.28, "elapsed_time": "2:19:40", "remaining_time": "7:40:24", "throughput": 21308.55, "total_tokens": 178585600} {"current_steps": 21900, "total_steps": 93654, "loss": 0.9524, "learning_rate": 4.3981023850740926e-05, "epoch": 0.7015183547953104, "percentage": 23.38, "elapsed_time": "2:27:18", "remaining_time": "8:02:39", "throughput": 20297.95, "total_tokens": 179404800} {"current_steps": 22000, "total_steps": 93654, "loss": 0.9641, "learning_rate": 4.392574780794901e-05, "epoch": 0.704721634954193, "percentage": 23.49, "elapsed_time": "2:34:56", "remaining_time": "8:24:37", "throughput": 19387.1, "total_tokens": 180224000} {"current_steps": 22100, "total_steps": 93654, "loss": 0.9838, "learning_rate": 4.387025418262242e-05, "epoch": 0.7079249151130758, "percentage": 23.6, "elapsed_time": "2:42:50", "remaining_time": "8:47:14", "throughput": 18529.29, "total_tokens": 181043200} {"current_steps": 22200, "total_steps": 93654, "loss": 1.0309, "learning_rate": 4.381454361275143e-05, "epoch": 0.7111281952719585, "percentage": 23.7, "elapsed_time": "2:50:29", "remaining_time": "9:08:43", "throughput": 17778.92, "total_tokens": 181862400} {"current_steps": 22300, "total_steps": 93654, "loss": 1.0029, "learning_rate": 4.3758616738820506e-05, "epoch": 0.7143314754308412, "percentage": 23.81, "elapsed_time": "2:58:07", "remaining_time": "9:29:56", "throughput": 17093.21, "total_tokens": 182681600} {"current_steps": 22400, "total_steps": 93654, "loss": 0.9842, "learning_rate": 4.370247420380085e-05, "epoch": 0.7175347555897239, "percentage": 23.92, "elapsed_time": "3:05:45", "remaining_time": "9:50:53", "throughput": 16464.29, "total_tokens": 183500800} {"current_steps": 22500, "total_steps": 93654, "loss": 0.9606, "learning_rate": 4.3646116653143046e-05, "epoch": 0.7207380357486066, "percentage": 24.02, "elapsed_time": "3:13:23", "remaining_time": "10:11:35", "throughput": 15884.69, "total_tokens": 184320000} {"current_steps": 22600, "total_steps": 93654, "loss": 0.9781, "learning_rate": 4.358954473476965e-05, "epoch": 0.7239413159074892, "percentage": 24.13, "elapsed_time": "3:21:03", "remaining_time": "10:32:05", "throughput": 15347.65, "total_tokens": 185139200} {"current_steps": 22700, "total_steps": 93654, "loss": 0.9823, "learning_rate": 4.353275909906772e-05, "epoch": 0.7271445960663719, "percentage": 24.24, "elapsed_time": "3:28:40", "remaining_time": "10:52:16", "throughput": 14851.9, "total_tokens": 185958400} {"current_steps": 22800, "total_steps": 93654, "loss": 0.988, "learning_rate": 4.3475760398881325e-05, "epoch": 0.7303478762252547, "percentage": 24.34, "elapsed_time": "3:36:20", "remaining_time": "11:12:17", "throughput": 14389.55, "total_tokens": 186777600} {"current_steps": 22900, "total_steps": 93654, "loss": 0.9878, "learning_rate": 4.3418549289504096e-05, "epoch": 0.7335511563841374, "percentage": 24.45, "elapsed_time": "3:43:59", "remaining_time": "11:32:03", "throughput": 13958.81, "total_tokens": 187596800} {"current_steps": 23000, "total_steps": 93654, "loss": 1.0091, "learning_rate": 4.3361126428671636e-05, "epoch": 0.7367544365430201, "percentage": 24.56, "elapsed_time": "3:51:37", "remaining_time": "11:51:33", "throughput": 13557.1, "total_tokens": 188416000} {"current_steps": 23100, "total_steps": 93654, "loss": 1.0383, "learning_rate": 4.330349247655398e-05, "epoch": 0.7399577167019028, "percentage": 24.67, "elapsed_time": "3:59:27", "remaining_time": "12:11:22", "throughput": 13171.05, "total_tokens": 189235200} {"current_steps": 23200, "total_steps": 93654, "loss": 0.9801, "learning_rate": 4.324564809574799e-05, "epoch": 0.7431609968607854, "percentage": 24.77, "elapsed_time": "4:07:07", "remaining_time": "12:30:27", "throughput": 12817.92, "total_tokens": 190054400} {"current_steps": 23300, "total_steps": 93654, "loss": 1.0095, "learning_rate": 4.318759395126979e-05, "epoch": 0.7463642770196681, "percentage": 24.88, "elapsed_time": "4:14:47", "remaining_time": "12:49:20", "throughput": 12485.57, "total_tokens": 190873600} {"current_steps": 23400, "total_steps": 93654, "loss": 0.9601, "learning_rate": 4.3129330710547035e-05, "epoch": 0.7495675571785508, "percentage": 24.99, "elapsed_time": "4:22:24", "remaining_time": "13:07:50", "throughput": 12174.94, "total_tokens": 191692800} {"current_steps": 23500, "total_steps": 93654, "loss": 0.9837, "learning_rate": 4.307085904341133e-05, "epoch": 0.7527708373374336, "percentage": 25.09, "elapsed_time": "4:30:02", "remaining_time": "13:26:08", "throughput": 11881.8, "total_tokens": 192512000} {"current_steps": 23600, "total_steps": 93654, "loss": 0.9647, "learning_rate": 4.3012179622090436e-05, "epoch": 0.7559741174963163, "percentage": 25.2, "elapsed_time": "4:37:39", "remaining_time": "13:44:13", "throughput": 11604.56, "total_tokens": 193331200} {"current_steps": 23700, "total_steps": 93654, "loss": 0.9439, "learning_rate": 4.295329312120063e-05, "epoch": 0.7591773976551989, "percentage": 25.31, "elapsed_time": "4:45:17", "remaining_time": "14:02:06", "throughput": 11341.9, "total_tokens": 194150400} {"current_steps": 23800, "total_steps": 93654, "loss": 0.9708, "learning_rate": 4.289420021773889e-05, "epoch": 0.7623806778140816, "percentage": 25.41, "elapsed_time": "4:52:56", "remaining_time": "14:19:46", "throughput": 11092.89, "total_tokens": 194969600} {"current_steps": 23900, "total_steps": 93654, "loss": 1.0109, "learning_rate": 4.283490159107513e-05, "epoch": 0.7655839579729643, "percentage": 25.52, "elapsed_time": "5:00:36", "remaining_time": "14:37:19", "throughput": 10855.38, "total_tokens": 195788800} {"current_steps": 24000, "total_steps": 93654, "loss": 1.0119, "learning_rate": 4.27753979229444e-05, "epoch": 0.768787238131847, "percentage": 25.63, "elapsed_time": "5:08:15", "remaining_time": "14:54:37", "throughput": 10630.21, "total_tokens": 196608000} {"current_steps": 24100, "total_steps": 93654, "loss": 0.9659, "learning_rate": 4.271568989743903e-05, "epoch": 0.7719905182907297, "percentage": 25.73, "elapsed_time": "5:16:04", "remaining_time": "15:12:13", "throughput": 10410.11, "total_tokens": 197427200} {"current_steps": 24200, "total_steps": 93654, "loss": 0.9729, "learning_rate": 4.265577820100076e-05, "epoch": 0.7751937984496124, "percentage": 25.84, "elapsed_time": "5:23:42", "remaining_time": "15:29:02", "throughput": 10207.08, "total_tokens": 198246400} {"current_steps": 24300, "total_steps": 93654, "loss": 0.9633, "learning_rate": 4.2595663522412884e-05, "epoch": 0.778397078608495, "percentage": 25.95, "elapsed_time": "5:31:20", "remaining_time": "15:45:40", "throughput": 10013.02, "total_tokens": 199065600} {"current_steps": 24400, "total_steps": 93654, "loss": 0.9687, "learning_rate": 4.253534655279232e-05, "epoch": 0.7816003587673778, "percentage": 26.05, "elapsed_time": "5:38:57", "remaining_time": "16:02:02", "throughput": 9828.58, "total_tokens": 199884800} {"current_steps": 24500, "total_steps": 93654, "loss": 1.0017, "learning_rate": 4.247482798558161e-05, "epoch": 0.7848036389262605, "percentage": 26.16, "elapsed_time": "5:46:35", "remaining_time": "16:18:18", "throughput": 9651.25, "total_tokens": 200704000} {"current_steps": 24600, "total_steps": 93654, "loss": 0.9905, "learning_rate": 4.241410851654102e-05, "epoch": 0.7880069190851432, "percentage": 26.27, "elapsed_time": "5:54:16", "remaining_time": "16:34:27", "throughput": 9480.77, "total_tokens": 201523200} {"current_steps": 24700, "total_steps": 93654, "loss": 1.0358, "learning_rate": 4.235318884374051e-05, "epoch": 0.7912101992440259, "percentage": 26.37, "elapsed_time": "6:01:54", "remaining_time": "16:50:19", "throughput": 9318.29, "total_tokens": 202342400} {"current_steps": 24800, "total_steps": 93654, "loss": 1.0105, "learning_rate": 4.229206966755172e-05, "epoch": 0.7944134794029086, "percentage": 26.48, "elapsed_time": "6:09:34", "remaining_time": "17:06:03", "throughput": 9162.11, "total_tokens": 203161600} {"current_steps": 24900, "total_steps": 93654, "loss": 0.9345, "learning_rate": 4.223075169063989e-05, "epoch": 0.7976167595617912, "percentage": 26.59, "elapsed_time": "6:17:12", "remaining_time": "17:21:32", "throughput": 9012.75, "total_tokens": 203980800} {"current_steps": 25000, "total_steps": 93654, "loss": 0.9655, "learning_rate": 4.21692356179558e-05, "epoch": 0.800820039720674, "percentage": 26.69, "elapsed_time": "6:24:50", "remaining_time": "17:36:50", "throughput": 8869.36, "total_tokens": 204800000} {"current_steps": 25100, "total_steps": 93654, "loss": 0.949, "learning_rate": 4.210752215672769e-05, "epoch": 0.8040233198795567, "percentage": 26.8, "elapsed_time": "6:32:36", "remaining_time": "17:52:18", "throughput": 8728.72, "total_tokens": 205619200} {"current_steps": 25200, "total_steps": 93654, "loss": 1.0082, "learning_rate": 4.204561201645307e-05, "epoch": 0.8072266000384394, "percentage": 26.91, "elapsed_time": "6:40:16", "remaining_time": "18:07:19", "throughput": 8595.7, "total_tokens": 206438400} {"current_steps": 25300, "total_steps": 93654, "loss": 1.0074, "learning_rate": 4.198350590889064e-05, "epoch": 0.8104298801973221, "percentage": 27.01, "elapsed_time": "6:47:57", "remaining_time": "18:22:11", "throughput": 8467.37, "total_tokens": 207257600} {"current_steps": 25400, "total_steps": 93654, "loss": 0.9638, "learning_rate": 4.192120454805203e-05, "epoch": 0.8136331603562047, "percentage": 27.12, "elapsed_time": "6:55:36", "remaining_time": "18:36:47", "throughput": 8344.42, "total_tokens": 208076800} {"current_steps": 25500, "total_steps": 93654, "loss": 0.9793, "learning_rate": 4.185870865019364e-05, "epoch": 0.8168364405150874, "percentage": 27.23, "elapsed_time": "7:03:14", "remaining_time": "18:51:13", "throughput": 8225.87, "total_tokens": 208896000} {"current_steps": 25600, "total_steps": 93654, "loss": 0.9515, "learning_rate": 4.17960189338084e-05, "epoch": 0.8200397206739701, "percentage": 27.33, "elapsed_time": "7:10:52", "remaining_time": "19:05:25", "throughput": 8111.93, "total_tokens": 209715200} {"current_steps": 25700, "total_steps": 93654, "loss": 0.9659, "learning_rate": 4.17331361196175e-05, "epoch": 0.8232430008328528, "percentage": 27.44, "elapsed_time": "7:18:30", "remaining_time": "19:19:27", "throughput": 8001.94, "total_tokens": 210534400} {"current_steps": 25800, "total_steps": 93654, "loss": 1.0496, "learning_rate": 4.167006093056209e-05, "epoch": 0.8264462809917356, "percentage": 27.55, "elapsed_time": "7:26:10", "remaining_time": "19:33:26", "throughput": 7894.97, "total_tokens": 211353600} {"current_steps": 25900, "total_steps": 93654, "loss": 0.9466, "learning_rate": 4.1606794091795e-05, "epoch": 0.8296495611506183, "percentage": 27.65, "elapsed_time": "7:33:48", "remaining_time": "19:47:10", "throughput": 7792.19, "total_tokens": 212172800} {"current_steps": 26000, "total_steps": 93654, "loss": 0.9308, "learning_rate": 4.154333633067238e-05, "epoch": 0.8328528413095009, "percentage": 27.76, "elapsed_time": "7:41:25", "remaining_time": "20:00:40", "throughput": 7693.19, "total_tokens": 212992000} {"current_steps": 26100, "total_steps": 93654, "loss": 0.9996, "learning_rate": 4.147968837674535e-05, "epoch": 0.8360561214683836, "percentage": 27.87, "elapsed_time": "7:49:15", "remaining_time": "20:14:34", "throughput": 7593.87, "total_tokens": 213811200} {"current_steps": 26200, "total_steps": 93654, "loss": 0.9862, "learning_rate": 4.141585096175162e-05, "epoch": 0.8392594016272663, "percentage": 27.98, "elapsed_time": "7:56:54", "remaining_time": "20:27:49", "throughput": 7500.84, "total_tokens": 214630400} {"current_steps": 26300, "total_steps": 93654, "loss": 1.0175, "learning_rate": 4.1351824819607056e-05, "epoch": 0.842462681786149, "percentage": 28.08, "elapsed_time": "8:04:33", "remaining_time": "20:40:56", "throughput": 7410.58, "total_tokens": 215449600} {"current_steps": 26400, "total_steps": 93654, "loss": 0.9903, "learning_rate": 4.128761068639723e-05, "epoch": 0.8456659619450317, "percentage": 28.19, "elapsed_time": "8:12:11", "remaining_time": "20:53:50", "throughput": 7323.39, "total_tokens": 216268800} {"current_steps": 26500, "total_steps": 93654, "loss": 1.0261, "learning_rate": 4.122320930036902e-05, "epoch": 0.8488692421039145, "percentage": 28.3, "elapsed_time": "8:19:50", "remaining_time": "21:06:38", "throughput": 7238.66, "total_tokens": 217088000} {"current_steps": 26600, "total_steps": 93654, "loss": 1.0048, "learning_rate": 4.1158621401922046e-05, "epoch": 0.8520725222627971, "percentage": 28.4, "elapsed_time": "8:27:27", "remaining_time": "21:19:12", "throughput": 7156.81, "total_tokens": 217907200} {"current_steps": 26700, "total_steps": 93654, "loss": 0.9659, "learning_rate": 4.109384773360023e-05, "epoch": 0.8552758024216798, "percentage": 28.51, "elapsed_time": "8:35:05", "remaining_time": "21:31:39", "throughput": 7077.31, "total_tokens": 218726400} {"current_steps": 26800, "total_steps": 93654, "loss": 1.0134, "learning_rate": 4.10288890400832e-05, "epoch": 0.8584790825805625, "percentage": 28.62, "elapsed_time": "8:42:44", "remaining_time": "21:43:59", "throughput": 6999.87, "total_tokens": 219545600} {"current_steps": 26900, "total_steps": 93654, "loss": 1.0011, "learning_rate": 4.0963746068177744e-05, "epoch": 0.8616823627394452, "percentage": 28.72, "elapsed_time": "8:50:25", "remaining_time": "21:56:16", "throughput": 6924.22, "total_tokens": 220364800} {"current_steps": 27000, "total_steps": 93654, "loss": 1.0777, "learning_rate": 4.089841956680927e-05, "epoch": 0.8648856428983279, "percentage": 28.83, "elapsed_time": "8:58:05", "remaining_time": "22:08:23", "throughput": 6850.78, "total_tokens": 221184000} {"current_steps": 27100, "total_steps": 93654, "loss": 1.0113, "learning_rate": 4.08329102870131e-05, "epoch": 0.8680889230572106, "percentage": 28.94, "elapsed_time": "9:05:57", "remaining_time": "22:20:47", "throughput": 6777.24, "total_tokens": 222003200} {"current_steps": 27200, "total_steps": 93654, "loss": 1.0182, "learning_rate": 4.076721898192597e-05, "epoch": 0.8712922032160932, "percentage": 29.04, "elapsed_time": "9:13:36", "remaining_time": "22:32:33", "throughput": 6708.14, "total_tokens": 222822400} {"current_steps": 27300, "total_steps": 93654, "loss": 0.9876, "learning_rate": 4.070134640677722e-05, "epoch": 0.874495483374976, "percentage": 29.15, "elapsed_time": "9:21:13", "remaining_time": "22:44:06", "throughput": 6641.38, "total_tokens": 223641600} {"current_steps": 27400, "total_steps": 93654, "loss": 0.9378, "learning_rate": 4.063529331888024e-05, "epoch": 0.8776987635338587, "percentage": 29.26, "elapsed_time": "9:28:53", "remaining_time": "22:55:34", "throughput": 6576.06, "total_tokens": 224460800} {"current_steps": 27500, "total_steps": 93654, "loss": 0.9864, "learning_rate": 4.056906047762368e-05, "epoch": 0.8809020436927414, "percentage": 29.36, "elapsed_time": "9:36:32", "remaining_time": "23:06:56", "throughput": 6512.37, "total_tokens": 225280000} {"current_steps": 27600, "total_steps": 93654, "loss": 0.9642, "learning_rate": 4.0502648644462774e-05, "epoch": 0.8841053238516241, "percentage": 29.47, "elapsed_time": "9:44:09", "remaining_time": "23:18:03", "throughput": 6450.77, "total_tokens": 226099200} {"current_steps": 27700, "total_steps": 93654, "loss": 0.968, "learning_rate": 4.043605858291053e-05, "epoch": 0.8873086040105067, "percentage": 29.58, "elapsed_time": "9:51:47", "remaining_time": "23:29:03", "throughput": 6390.7, "total_tokens": 226918400} {"current_steps": 27800, "total_steps": 93654, "loss": 1.0126, "learning_rate": 4.036929105852901e-05, "epoch": 0.8905118841693894, "percentage": 29.68, "elapsed_time": "9:59:26", "remaining_time": "23:40:00", "throughput": 6331.86, "total_tokens": 227737600} {"current_steps": 27900, "total_steps": 93654, "loss": 1.0438, "learning_rate": 4.0302346838920514e-05, "epoch": 0.8937151643282721, "percentage": 29.79, "elapsed_time": "10:07:07", "remaining_time": "23:50:52", "throughput": 6274.23, "total_tokens": 228556800} {"current_steps": 27100, "total_steps": 93654, "loss": 1.0116, "learning_rate": 4.08329102870131e-05, "epoch": 0.8680889230572106, "percentage": 28.94, "elapsed_time": "0:08:18", "remaining_time": "0:20:25", "throughput": 444990.85, "total_tokens": 222003200} {"current_steps": 27200, "total_steps": 93654, "loss": 1.0182, "learning_rate": 4.076721898192597e-05, "epoch": 0.8712922032160932, "percentage": 29.04, "elapsed_time": "0:16:20", "remaining_time": "0:39:56", "throughput": 227176.19, "total_tokens": 222822400} {"current_steps": 27300, "total_steps": 93654, "loss": 0.9877, "learning_rate": 4.070134640677722e-05, "epoch": 0.874495483374976, "percentage": 29.15, "elapsed_time": "0:24:34", "remaining_time": "0:59:43", "throughput": 151680.42, "total_tokens": 223641600} {"current_steps": 27400, "total_steps": 93654, "loss": 0.9377, "learning_rate": 4.063529331888024e-05, "epoch": 0.8776987635338587, "percentage": 29.26, "elapsed_time": "0:33:07", "remaining_time": "1:20:06", "throughput": 112909.09, "total_tokens": 224460800} {"current_steps": 27500, "total_steps": 93654, "loss": 0.9869, "learning_rate": 4.056906047762368e-05, "epoch": 0.8809020436927414, "percentage": 29.36, "elapsed_time": "0:41:15", "remaining_time": "1:39:15", "throughput": 90991.89, "total_tokens": 225280000} {"current_steps": 27100, "total_steps": 93654, "loss": 1.0113, "learning_rate": 4.08329102870131e-05, "epoch": 0.8680889230572106, "percentage": 28.94, "elapsed_time": "0:08:33", "remaining_time": "0:21:01", "throughput": 432271.71, "total_tokens": 222003200} {"current_steps": 27200, "total_steps": 93654, "loss": 1.0181, "learning_rate": 4.076721898192597e-05, "epoch": 0.8712922032160932, "percentage": 29.04, "elapsed_time": "0:16:46", "remaining_time": "0:40:59", "throughput": 221336.65, "total_tokens": 222822400} {"current_steps": 27300, "total_steps": 93654, "loss": 0.9882, "learning_rate": 4.070134640677722e-05, "epoch": 0.874495483374976, "percentage": 29.15, "elapsed_time": "0:25:12", "remaining_time": "1:01:15", "throughput": 147909.1, "total_tokens": 223641600} {"current_steps": 27400, "total_steps": 93654, "loss": 0.9378, "learning_rate": 4.063529331888024e-05, "epoch": 0.8776987635338587, "percentage": 29.26, "elapsed_time": "0:34:57", "remaining_time": "1:24:31", "throughput": 107010.21, "total_tokens": 224460800} {"current_steps": 27500, "total_steps": 93654, "loss": 0.9867, "learning_rate": 4.056906047762368e-05, "epoch": 0.8809020436927414, "percentage": 29.36, "elapsed_time": "0:44:59", "remaining_time": "1:48:13", "throughput": 83460.64, "total_tokens": 225280000} {"current_steps": 27600, "total_steps": 93654, "loss": 0.9645, "learning_rate": 4.0502648644462774e-05, "epoch": 0.8841053238516241, "percentage": 29.47, "elapsed_time": "0:55:30", "remaining_time": "2:12:50", "throughput": 67889.03, "total_tokens": 226099200} {"current_steps": 27700, "total_steps": 93654, "loss": 0.9678, "learning_rate": 4.043605858291053e-05, "epoch": 0.8873086040105067, "percentage": 29.58, "elapsed_time": "1:04:47", "remaining_time": "2:34:16", "throughput": 58371.6, "total_tokens": 226918400} {"current_steps": 27800, "total_steps": 93654, "loss": 1.0127, "learning_rate": 4.036929105852901e-05, "epoch": 0.8905118841693894, "percentage": 29.68, "elapsed_time": "1:16:38", "remaining_time": "3:01:34", "throughput": 49519.86, "total_tokens": 227737600} {"current_steps": 27900, "total_steps": 93654, "loss": 1.0439, "learning_rate": 4.0302346838920514e-05, "epoch": 0.8937151643282721, "percentage": 29.79, "elapsed_time": "1:24:14", "remaining_time": "3:18:31", "throughput": 45222.26, "total_tokens": 228556800} {"current_steps": 28000, "total_steps": 93654, "loss": 0.9393, "learning_rate": 4.02352266937187e-05, "epoch": 0.8969184444871549, "percentage": 29.9, "elapsed_time": "1:31:41", "remaining_time": "3:35:00", "throughput": 41690.33, "total_tokens": 229376000} {"current_steps": 28100, "total_steps": 93654, "loss": 0.8966, "learning_rate": 4.016793139457982e-05, "epoch": 0.9001217246460376, "percentage": 30.0, "elapsed_time": "1:39:38", "remaining_time": "3:52:28", "throughput": 38500.8, "total_tokens": 230195200} {"current_steps": 28200, "total_steps": 93654, "loss": 0.9858, "learning_rate": 4.0100461715173777e-05, "epoch": 0.9033250048049203, "percentage": 30.11, "elapsed_time": "1:47:09", "remaining_time": "4:08:43", "throughput": 35928.7, "total_tokens": 231014400} {"current_steps": 28100, "total_steps": 93654, "loss": 0.8966, "learning_rate": 4.016793139457982e-05, "epoch": 0.9001217246460376, "percentage": 30.0, "elapsed_time": "0:07:54", "remaining_time": "0:18:27", "throughput": 485096.52, "total_tokens": 230195200} {"current_steps": 28200, "total_steps": 93654, "loss": 0.9861, "learning_rate": 4.0100461715173777e-05, "epoch": 0.9033250048049203, "percentage": 30.11, "elapsed_time": "0:15:44", "remaining_time": "0:36:32", "throughput": 244585.08, "total_tokens": 231014400} {"current_steps": 28300, "total_steps": 93654, "loss": 1.0012, "learning_rate": 4.003281843117528e-05, "epoch": 0.9065282849638029, "percentage": 30.22, "elapsed_time": "0:23:35", "remaining_time": "0:54:28", "throughput": 163804.76, "total_tokens": 231833600} {"current_steps": 28400, "total_steps": 93654, "loss": 0.9602, "learning_rate": 3.9965002320254924e-05, "epoch": 0.9097315651226856, "percentage": 30.32, "elapsed_time": "0:31:24", "remaining_time": "1:12:11", "throughput": 123423.9, "total_tokens": 232652800} {"current_steps": 28500, "total_steps": 93654, "loss": 0.988, "learning_rate": 3.989701416207019e-05, "epoch": 0.9129348452815683, "percentage": 30.43, "elapsed_time": "0:39:13", "remaining_time": "1:29:40", "throughput": 99195.51, "total_tokens": 233472000} {"current_steps": 28600, "total_steps": 93654, "loss": 1.0339, "learning_rate": 3.9828854738256564e-05, "epoch": 0.916138125440451, "percentage": 30.54, "elapsed_time": "0:47:02", "remaining_time": "1:47:01", "throughput": 82993.74, "total_tokens": 234291200} {"current_steps": 28700, "total_steps": 93654, "loss": 1.0025, "learning_rate": 3.976052483241849e-05, "epoch": 0.9193414055993337, "percentage": 30.64, "elapsed_time": "0:54:51", "remaining_time": "2:04:08", "throughput": 71433.91, "total_tokens": 235110400} {"current_steps": 28800, "total_steps": 93654, "loss": 1.0335, "learning_rate": 3.969202523012038e-05, "epoch": 0.9225446857582165, "percentage": 30.75, "elapsed_time": "1:02:39", "remaining_time": "2:21:05", "throughput": 62761.44, "total_tokens": 235929600} {"current_steps": 28900, "total_steps": 93654, "loss": 0.9721, "learning_rate": 3.9623356718877605e-05, "epoch": 0.9257479659170991, "percentage": 30.86, "elapsed_time": "1:10:27", "remaining_time": "2:37:51", "throughput": 56008.14, "total_tokens": 236748800} {"current_steps": 29000, "total_steps": 93654, "loss": 0.9866, "learning_rate": 3.955452008814741e-05, "epoch": 0.9289512460759818, "percentage": 30.97, "elapsed_time": "1:18:15", "remaining_time": "2:54:28", "throughput": 50592.52, "total_tokens": 237568000} {"current_steps": 29100, "total_steps": 93654, "loss": 0.9863, "learning_rate": 3.9485516129319844e-05, "epoch": 0.9321545262348645, "percentage": 31.07, "elapsed_time": "1:26:16", "remaining_time": "3:11:22", "throughput": 46056.12, "total_tokens": 238387200} {"current_steps": 29200, "total_steps": 93654, "loss": 0.9902, "learning_rate": 3.9416345635708676e-05, "epoch": 0.9353578063937472, "percentage": 31.18, "elapsed_time": "1:34:01", "remaining_time": "3:27:32", "throughput": 42400.58, "total_tokens": 239206400} {"current_steps": 29300, "total_steps": 93654, "loss": 0.991, "learning_rate": 3.9347009402542256e-05, "epoch": 0.9385610865526299, "percentage": 31.29, "elapsed_time": "1:41:48", "remaining_time": "3:43:36", "throughput": 39293.84, "total_tokens": 240025600} {"current_steps": 29400, "total_steps": 93654, "loss": 0.9851, "learning_rate": 3.9277508226954394e-05, "epoch": 0.9417643667115125, "percentage": 31.39, "elapsed_time": "1:49:48", "remaining_time": "3:59:59", "throughput": 36554.23, "total_tokens": 240844800} {"current_steps": 29500, "total_steps": 93654, "loss": 1.0144, "learning_rate": 3.920784290797519e-05, "epoch": 0.9449676468703953, "percentage": 31.5, "elapsed_time": "1:57:53", "remaining_time": "4:16:23", "throughput": 34163.27, "total_tokens": 241664000} {"current_steps": 29600, "total_steps": 93654, "loss": 0.9529, "learning_rate": 3.9138014246521806e-05, "epoch": 0.948170927029278, "percentage": 31.61, "elapsed_time": "2:05:57", "remaining_time": "4:32:33", "throughput": 32085.95, "total_tokens": 242483200} {"current_steps": 29700, "total_steps": 93654, "loss": 0.9949, "learning_rate": 3.906802304538935e-05, "epoch": 0.9513742071881607, "percentage": 31.71, "elapsed_time": "2:14:02", "remaining_time": "4:48:38", "throughput": 30251.46, "total_tokens": 243302400} {"current_steps": 29800, "total_steps": 93654, "loss": 0.9596, "learning_rate": 3.899787010924152e-05, "epoch": 0.9545774873470434, "percentage": 31.82, "elapsed_time": "2:22:06", "remaining_time": "5:04:30", "throughput": 28629.8, "total_tokens": 244121600} {"current_steps": 29900, "total_steps": 93654, "loss": 0.9813, "learning_rate": 3.8927556244601495e-05, "epoch": 0.9577807675059261, "percentage": 31.93, "elapsed_time": "2:30:10", "remaining_time": "5:20:13", "throughput": 27183.26, "total_tokens": 244940800} {"current_steps": 30000, "total_steps": 93654, "loss": 0.9747, "learning_rate": 3.885708225984254e-05, "epoch": 0.9609840476648087, "percentage": 32.03, "elapsed_time": "2:38:15", "remaining_time": "5:35:47", "throughput": 25882.43, "total_tokens": 245760000} {"current_steps": 30100, "total_steps": 93654, "loss": 0.9933, "learning_rate": 3.878644896517879e-05, "epoch": 0.9641873278236914, "percentage": 32.14, "elapsed_time": "2:46:29", "remaining_time": "5:51:31", "throughput": 24684.78, "total_tokens": 246579200} {"current_steps": 30200, "total_steps": 93654, "loss": 0.964, "learning_rate": 3.87156571726559e-05, "epoch": 0.9673906079825741, "percentage": 32.25, "elapsed_time": "2:54:33", "remaining_time": "6:06:46", "throughput": 23620.79, "total_tokens": 247398400} {"current_steps": 30300, "total_steps": 93654, "loss": 0.9784, "learning_rate": 3.8644707696141704e-05, "epoch": 0.9705938881414569, "percentage": 32.35, "elapsed_time": "3:02:38", "remaining_time": "6:21:53", "throughput": 22649.99, "total_tokens": 248217600} {"current_steps": 30400, "total_steps": 93654, "loss": 1.0191, "learning_rate": 3.857360135131691e-05, "epoch": 0.9737971683003396, "percentage": 32.46, "elapsed_time": "3:10:44", "remaining_time": "6:36:53", "throughput": 21759.91, "total_tokens": 249036800} {"current_steps": 30500, "total_steps": 93654, "loss": 0.9769, "learning_rate": 3.8502338955665644e-05, "epoch": 0.9770004484592223, "percentage": 32.57, "elapsed_time": "3:18:48", "remaining_time": "6:51:38", "throughput": 20946.56, "total_tokens": 249856000} {"current_steps": 30600, "total_steps": 93654, "loss": 1.0179, "learning_rate": 3.843092132846613e-05, "epoch": 0.9802037286181049, "percentage": 32.67, "elapsed_time": "3:26:53", "remaining_time": "7:06:19", "throughput": 20193.18, "total_tokens": 250675200} {"current_steps": 30700, "total_steps": 93654, "loss": 0.9206, "learning_rate": 3.835934929078119e-05, "epoch": 0.9834070087769876, "percentage": 32.78, "elapsed_time": "3:34:57", "remaining_time": "7:20:48", "throughput": 19499.24, "total_tokens": 251494400} {"current_steps": 30800, "total_steps": 93654, "loss": 0.9686, "learning_rate": 3.828762366544888e-05, "epoch": 0.9866102889358703, "percentage": 32.89, "elapsed_time": "3:43:02", "remaining_time": "7:35:08", "throughput": 18854.7, "total_tokens": 252313600} {"current_steps": 30900, "total_steps": 93654, "loss": 0.9694, "learning_rate": 3.8215745277073e-05, "epoch": 0.989813569094753, "percentage": 32.99, "elapsed_time": "3:51:06", "remaining_time": "7:49:21", "throughput": 18254.81, "total_tokens": 253132800} {"current_steps": 31000, "total_steps": 93654, "loss": 0.8879, "learning_rate": 3.8143714952013584e-05, "epoch": 0.9930168492536358, "percentage": 33.1, "elapsed_time": "3:59:10", "remaining_time": "8:03:23", "throughput": 17696.48, "total_tokens": 253952000} {"current_steps": 31100, "total_steps": 93654, "loss": 0.9948, "learning_rate": 3.807153351837746e-05, "epoch": 0.9962201294125185, "percentage": 33.21, "elapsed_time": "4:07:32", "remaining_time": "8:17:53", "throughput": 17153.73, "total_tokens": 254771200} {"current_steps": 31200, "total_steps": 93654, "loss": 1.027, "learning_rate": 3.799920180600868e-05, "epoch": 0.9994234095714011, "percentage": 33.31, "elapsed_time": "4:15:39", "remaining_time": "8:31:46", "throughput": 16661.73, "total_tokens": 255590400} {"current_steps": 31300, "total_steps": 93654, "loss": 0.9665, "learning_rate": 3.792672064647898e-05, "epoch": 1.0026266897302838, "percentage": 33.42, "elapsed_time": "4:23:46", "remaining_time": "8:45:27", "throughput": 16201.66, "total_tokens": 256409600} {"current_steps": 31400, "total_steps": 93654, "loss": 0.8671, "learning_rate": 3.785409087307828e-05, "epoch": 1.0058299698891664, "percentage": 33.53, "elapsed_time": "4:31:48", "remaining_time": "8:58:54", "throughput": 15772.24, "total_tokens": 257228800} {"current_steps": 31500, "total_steps": 93654, "loss": 0.9356, "learning_rate": 3.778131332080503e-05, "epoch": 1.0090332500480492, "percentage": 33.63, "elapsed_time": "4:39:54", "remaining_time": "9:12:17", "throughput": 15365.45, "total_tokens": 258048000} {"current_steps": 31600, "total_steps": 93654, "loss": 0.9751, "learning_rate": 3.7708388826356636e-05, "epoch": 1.0122365302069318, "percentage": 33.74, "elapsed_time": "4:48:00", "remaining_time": "9:25:35", "throughput": 14979.89, "total_tokens": 258867200} {"current_steps": 31700, "total_steps": 93654, "loss": 0.8963, "learning_rate": 3.763531822811986e-05, "epoch": 1.0154398103658147, "percentage": 33.85, "elapsed_time": "4:56:03", "remaining_time": "9:38:36", "throughput": 14619.37, "total_tokens": 259686400} {"current_steps": 31800, "total_steps": 93654, "loss": 0.9021, "learning_rate": 3.756210236616117e-05, "epoch": 1.0186430905246973, "percentage": 33.95, "elapsed_time": "5:04:07", "remaining_time": "9:51:32", "throughput": 14276.31, "total_tokens": 260505600} {"current_steps": 31900, "total_steps": 93654, "loss": 0.947, "learning_rate": 3.7488742082217064e-05, "epoch": 1.02184637068358, "percentage": 34.06, "elapsed_time": "5:12:10", "remaining_time": "10:04:20", "throughput": 13951.53, "total_tokens": 261324800} {"current_steps": 32000, "total_steps": 93654, "loss": 0.9314, "learning_rate": 3.741523821968441e-05, "epoch": 1.0250496508424627, "percentage": 34.17, "elapsed_time": "5:20:15", "remaining_time": "10:17:02", "throughput": 13642.25, "total_tokens": 262144000} {"current_steps": 32100, "total_steps": 93654, "loss": 0.9523, "learning_rate": 3.734159162361077e-05, "epoch": 1.0282529310013453, "percentage": 34.28, "elapsed_time": "5:28:33", "remaining_time": "10:30:02", "throughput": 13339.19, "total_tokens": 262963200} {"current_steps": 32200, "total_steps": 93654, "loss": 0.9119, "learning_rate": 3.7267803140684635e-05, "epoch": 1.0314562111602281, "percentage": 34.38, "elapsed_time": "5:36:38", "remaining_time": "10:42:29", "throughput": 13059.41, "total_tokens": 263782400} {"current_steps": 32300, "total_steps": 93654, "loss": 0.9027, "learning_rate": 3.719387361922573e-05, "epoch": 1.0346594913191107, "percentage": 34.49, "elapsed_time": "5:44:40", "remaining_time": "10:54:43", "throughput": 12794.51, "total_tokens": 264601600} {"current_steps": 32400, "total_steps": 93654, "loss": 0.9126, "learning_rate": 3.711980390917523e-05, "epoch": 1.0378627714779936, "percentage": 34.6, "elapsed_time": "5:52:44", "remaining_time": "11:06:52", "throughput": 12540.87, "total_tokens": 265420800} {"current_steps": 32500, "total_steps": 93654, "loss": 0.909, "learning_rate": 3.7045594862086065e-05, "epoch": 1.0410660516368762, "percentage": 34.7, "elapsed_time": "6:00:49", "remaining_time": "11:18:56", "throughput": 12297.86, "total_tokens": 266240000} {"current_steps": 32600, "total_steps": 93654, "loss": 0.8809, "learning_rate": 3.697124733111299e-05, "epoch": 1.0442693317957588, "percentage": 34.81, "elapsed_time": "6:08:52", "remaining_time": "11:30:50", "throughput": 12066.42, "total_tokens": 267059200} {"current_steps": 32700, "total_steps": 93654, "loss": 0.9155, "learning_rate": 3.689676217100293e-05, "epoch": 1.0474726119546416, "percentage": 34.92, "elapsed_time": "6:16:55", "remaining_time": "11:42:36", "throughput": 11844.83, "total_tokens": 267878400} {"current_steps": 32800, "total_steps": 93654, "loss": 0.9514, "learning_rate": 3.682214023808506e-05, "epoch": 1.0506758921135242, "percentage": 35.02, "elapsed_time": "6:25:01", "remaining_time": "11:54:19", "throughput": 11631.35, "total_tokens": 268697600} {"current_steps": 32900, "total_steps": 93654, "loss": 0.9057, "learning_rate": 3.674738239026097e-05, "epoch": 1.053879172272407, "percentage": 35.13, "elapsed_time": "6:33:03", "remaining_time": "12:05:50", "throughput": 11428.09, "total_tokens": 269516800} {"current_steps": 33000, "total_steps": 93654, "loss": 0.9083, "learning_rate": 3.667248948699482e-05, "epoch": 1.0570824524312896, "percentage": 35.24, "elapsed_time": "6:41:08", "remaining_time": "12:17:17", "throughput": 11232.09, "total_tokens": 270336000} {"current_steps": 33100, "total_steps": 93654, "loss": 0.9211, "learning_rate": 3.659746238930345e-05, "epoch": 1.0602857325901724, "percentage": 35.34, "elapsed_time": "6:49:21", "remaining_time": "12:28:52", "throughput": 11040.04, "total_tokens": 271155200} {"current_steps": 33200, "total_steps": 93654, "loss": 0.9384, "learning_rate": 3.6522301959746514e-05, "epoch": 1.063489012749055, "percentage": 35.45, "elapsed_time": "6:57:26", "remaining_time": "12:40:07", "throughput": 10858.64, "total_tokens": 271974400} {"current_steps": 33300, "total_steps": 93654, "loss": 0.9296, "learning_rate": 3.6447009062416506e-05, "epoch": 1.0666922929079377, "percentage": 35.56, "elapsed_time": "7:05:30", "remaining_time": "12:51:12", "throughput": 10684.98, "total_tokens": 272793600} {"current_steps": 33400, "total_steps": 93654, "loss": 0.8913, "learning_rate": 3.637158456292885e-05, "epoch": 1.0698955730668205, "percentage": 35.66, "elapsed_time": "7:13:34", "remaining_time": "13:02:10", "throughput": 10517.77, "total_tokens": 273612800} {"current_steps": 33500, "total_steps": 93654, "loss": 0.9251, "learning_rate": 3.629602932841199e-05, "epoch": 1.073098853225703, "percentage": 35.77, "elapsed_time": "7:21:37", "remaining_time": "13:13:00", "throughput": 10356.86, "total_tokens": 274432000} {"current_steps": 33600, "total_steps": 93654, "loss": 0.9024, "learning_rate": 3.622034422749734e-05, "epoch": 1.076302133384586, "percentage": 35.88, "elapsed_time": "7:29:41", "remaining_time": "13:23:44", "throughput": 10201.58, "total_tokens": 275251200} {"current_steps": 33700, "total_steps": 93654, "loss": 0.8965, "learning_rate": 3.614453013030936e-05, "epoch": 1.0795054135434685, "percentage": 35.98, "elapsed_time": "7:37:44", "remaining_time": "13:34:19", "throughput": 10052.08, "total_tokens": 276070400} {"current_steps": 33800, "total_steps": 93654, "loss": 0.9058, "learning_rate": 3.606858790845555e-05, "epoch": 1.0827086937023511, "percentage": 36.09, "elapsed_time": "7:45:48", "remaining_time": "13:44:51", "throughput": 9907.24, "total_tokens": 276889600} {"current_steps": 33900, "total_steps": 93654, "loss": 0.9052, "learning_rate": 3.5992518435016376e-05, "epoch": 1.085911973861234, "percentage": 36.2, "elapsed_time": "7:53:52", "remaining_time": "13:55:16", "throughput": 9767.4, "total_tokens": 277708800} {"current_steps": 34000, "total_steps": 93654, "loss": 0.9027, "learning_rate": 3.59163225845353e-05, "epoch": 1.0891152540201166, "percentage": 36.3, "elapsed_time": "8:01:55", "remaining_time": "14:05:33", "throughput": 9632.36, "total_tokens": 278528000} {"current_steps": 34100, "total_steps": 93654, "loss": 0.8947, "learning_rate": 3.584000123300869e-05, "epoch": 1.0923185341789994, "percentage": 36.41, "elapsed_time": "8:10:02", "remaining_time": "14:15:50", "throughput": 9500.67, "total_tokens": 279347200} {"current_steps": 34200, "total_steps": 93654, "loss": 0.8998, "learning_rate": 3.576355525787576e-05, "epoch": 1.095521814337882, "percentage": 36.52, "elapsed_time": "8:18:08", "remaining_time": "14:25:59", "throughput": 9373.68, "total_tokens": 280166400} {"current_steps": 34300, "total_steps": 93654, "loss": 0.8951, "learning_rate": 3.5686985538008445e-05, "epoch": 1.0987250944967646, "percentage": 36.62, "elapsed_time": "8:26:12", "remaining_time": "14:35:57", "throughput": 9251.42, "total_tokens": 280985600} {"current_steps": 34400, "total_steps": 93654, "loss": 0.9009, "learning_rate": 3.561029295370138e-05, "epoch": 1.1019283746556474, "percentage": 36.73, "elapsed_time": "8:34:14", "remaining_time": "14:45:47", "throughput": 9133.2, "total_tokens": 281804800} {"current_steps": 34500, "total_steps": 93654, "loss": 0.9592, "learning_rate": 3.5533478386661665e-05, "epoch": 1.10513165481453, "percentage": 36.84, "elapsed_time": "8:42:18", "remaining_time": "14:55:33", "throughput": 9018.36, "total_tokens": 282624000} {"current_steps": 34600, "total_steps": 93654, "loss": 0.8587, "learning_rate": 3.545654271999886e-05, "epoch": 1.1083349349734128, "percentage": 36.94, "elapsed_time": "8:50:21", "remaining_time": "15:05:11", "throughput": 8907.39, "total_tokens": 283443200} {"current_steps": 34700, "total_steps": 93654, "loss": 0.906, "learning_rate": 3.5379486838214715e-05, "epoch": 1.1115382151322954, "percentage": 37.05, "elapsed_time": "8:58:25", "remaining_time": "15:14:45", "throughput": 8799.28, "total_tokens": 284262400} {"current_steps": 34800, "total_steps": 93654, "loss": 0.8925, "learning_rate": 3.530231162719307e-05, "epoch": 1.1147414952911783, "percentage": 37.16, "elapsed_time": "9:06:29", "remaining_time": "15:24:14", "throughput": 8694.26, "total_tokens": 285081600} {"current_steps": 34900, "total_steps": 93654, "loss": 0.8922, "learning_rate": 3.5225017974189644e-05, "epoch": 1.1179447754500609, "percentage": 37.26, "elapsed_time": "9:14:32", "remaining_time": "15:33:33", "throughput": 8592.78, "total_tokens": 285900800} {"current_steps": 35000, "total_steps": 93654, "loss": 0.884, "learning_rate": 3.5147606767821846e-05, "epoch": 1.1211480556089435, "percentage": 37.37, "elapsed_time": "9:22:35", "remaining_time": "15:42:48", "throughput": 8493.97, "total_tokens": 286720000} {"current_steps": 35100, "total_steps": 93654, "loss": 0.8941, "learning_rate": 3.507007889805856e-05, "epoch": 1.1243513357678263, "percentage": 37.48, "elapsed_time": "9:30:39", "remaining_time": "15:51:59", "throughput": 8397.8, "total_tokens": 287539200} {"current_steps": 35200, "total_steps": 93654, "loss": 0.9209, "learning_rate": 3.499243525620988e-05, "epoch": 1.127554615926709, "percentage": 37.59, "elapsed_time": "9:38:44", "remaining_time": "16:01:03", "throughput": 8304.26, "total_tokens": 288358400} {"current_steps": 35300, "total_steps": 93654, "loss": 0.9284, "learning_rate": 3.491467673491692e-05, "epoch": 1.1307578960855917, "percentage": 37.69, "elapsed_time": "9:46:47", "remaining_time": "16:10:00", "throughput": 8213.58, "total_tokens": 289177600} {"current_steps": 35400, "total_steps": 93654, "loss": 0.9036, "learning_rate": 3.483680422814152e-05, "epoch": 1.1339611762444743, "percentage": 37.8, "elapsed_time": "9:54:50", "remaining_time": "16:18:52", "throughput": 8125.27, "total_tokens": 289996800} {"current_steps": 35500, "total_steps": 93654, "loss": 0.8766, "learning_rate": 3.4758818631155934e-05, "epoch": 1.137164456403357, "percentage": 37.91, "elapsed_time": "10:02:53", "remaining_time": "16:27:37", "throughput": 8039.4, "total_tokens": 290816000} {"current_steps": 35600, "total_steps": 93654, "loss": 0.8996, "learning_rate": 3.4680720840532636e-05, "epoch": 1.1403677365622398, "percentage": 38.01, "elapsed_time": "10:10:57", "remaining_time": "16:36:18", "throughput": 7955.68, "total_tokens": 291635200} {"current_steps": 35700, "total_steps": 93654, "loss": 0.932, "learning_rate": 3.460251175413388e-05, "epoch": 1.1435710167211224, "percentage": 38.12, "elapsed_time": "10:19:03", "remaining_time": "16:44:56", "throughput": 7873.68, "total_tokens": 292454400} {"current_steps": 35800, "total_steps": 93654, "loss": 0.9095, "learning_rate": 3.452419227110151e-05, "epoch": 1.1467742968800052, "percentage": 38.23, "elapsed_time": "10:27:06", "remaining_time": "16:53:26", "throughput": 7794.27, "total_tokens": 293273600} {"current_steps": 35900, "total_steps": 93654, "loss": 0.9166, "learning_rate": 3.444576329184651e-05, "epoch": 1.1499775770388878, "percentage": 38.33, "elapsed_time": "10:35:09", "remaining_time": "17:01:49", "throughput": 7716.95, "total_tokens": 294092800} {"current_steps": 36000, "total_steps": 93654, "loss": 0.9445, "learning_rate": 3.436722571803874e-05, "epoch": 1.1531808571977704, "percentage": 38.44, "elapsed_time": "10:43:16", "remaining_time": "17:10:11", "throughput": 7640.99, "total_tokens": 294912000} {"current_steps": 36100, "total_steps": 93654, "loss": 0.8947, "learning_rate": 3.428858045259652e-05, "epoch": 1.1563841373566532, "percentage": 38.55, "elapsed_time": "10:51:26", "remaining_time": "17:18:35", "throughput": 7566.07, "total_tokens": 295731200} {"current_steps": 36200, "total_steps": 93654, "loss": 0.9532, "learning_rate": 3.420982839967624e-05, "epoch": 1.1595874175155358, "percentage": 38.65, "elapsed_time": "10:59:30", "remaining_time": "17:26:44", "throughput": 7494.15, "total_tokens": 296550400} {"current_steps": 36300, "total_steps": 93654, "loss": 0.9716, "learning_rate": 3.413097046466203e-05, "epoch": 1.1627906976744187, "percentage": 38.76, "elapsed_time": "11:07:35", "remaining_time": "17:34:47", "throughput": 7423.95, "total_tokens": 297369600} {"current_steps": 36400, "total_steps": 93654, "loss": 0.9364, "learning_rate": 3.405200755415527e-05, "epoch": 1.1659939778333013, "percentage": 38.87, "elapsed_time": "11:15:40", "remaining_time": "17:42:46", "throughput": 7355.33, "total_tokens": 298188800} {"current_steps": 36500, "total_steps": 93654, "loss": 0.8933, "learning_rate": 3.397294057596424e-05, "epoch": 1.169197257992184, "percentage": 38.97, "elapsed_time": "11:23:42", "remaining_time": "17:50:35", "throughput": 7288.87, "total_tokens": 299008000} {"current_steps": 36600, "total_steps": 93654, "loss": 0.8916, "learning_rate": 3.389377043909361e-05, "epoch": 1.1724005381510667, "percentage": 39.08, "elapsed_time": "11:31:46", "remaining_time": "17:58:22", "throughput": 7223.59, "total_tokens": 299827200} {"current_steps": 36700, "total_steps": 93654, "loss": 0.922, "learning_rate": 3.381449805373406e-05, "epoch": 1.1756038183099493, "percentage": 39.19, "elapsed_time": "11:39:48", "remaining_time": "18:06:01", "throughput": 7160.18, "total_tokens": 300646400} {"current_steps": 36800, "total_steps": 93654, "loss": 0.9093, "learning_rate": 3.3735124331251764e-05, "epoch": 1.1788070984688321, "percentage": 39.29, "elapsed_time": "11:47:51", "remaining_time": "18:13:36", "throughput": 7098.07, "total_tokens": 301465600} {"current_steps": 36900, "total_steps": 93654, "loss": 0.9553, "learning_rate": 3.3655650184177957e-05, "epoch": 1.1820103786277147, "percentage": 39.4, "elapsed_time": "11:55:55", "remaining_time": "18:21:07", "throughput": 7037.13, "total_tokens": 302284800} {"current_steps": 37000, "total_steps": 93654, "loss": 0.8768, "learning_rate": 3.357607652619839e-05, "epoch": 1.1852136587865976, "percentage": 39.51, "elapsed_time": "12:03:58", "remaining_time": "18:28:32", "throughput": 6977.82, "total_tokens": 303104000} {"current_steps": 37100, "total_steps": 93654, "loss": 0.9632, "learning_rate": 3.349640427214287e-05, "epoch": 1.1884169389454802, "percentage": 39.61, "elapsed_time": "12:12:12", "remaining_time": "18:36:09", "throughput": 6917.95, "total_tokens": 303923200} {"current_steps": 37200, "total_steps": 93654, "loss": 0.8682, "learning_rate": 3.341663433797474e-05, "epoch": 1.1916202191043628, "percentage": 39.72, "elapsed_time": "12:20:15", "remaining_time": "18:43:24", "throughput": 6861.1, "total_tokens": 304742400} {"current_steps": 37300, "total_steps": 93654, "loss": 0.9334, "learning_rate": 3.33367676407803e-05, "epoch": 1.1948234992632456, "percentage": 39.83, "elapsed_time": "12:28:19", "remaining_time": "18:50:35", "throughput": 6805.45, "total_tokens": 305561600} {"current_steps": 37400, "total_steps": 93654, "loss": 0.9073, "learning_rate": 3.3256805098758346e-05, "epoch": 1.1980267794221282, "percentage": 39.93, "elapsed_time": "12:36:24", "remaining_time": "18:57:43", "throughput": 6750.83, "total_tokens": 306380800} {"current_steps": 37500, "total_steps": 93654, "loss": 0.9343, "learning_rate": 3.3176747631209534e-05, "epoch": 1.201230059581011, "percentage": 40.04, "elapsed_time": "12:44:28", "remaining_time": "19:04:45", "throughput": 6697.44, "total_tokens": 307200000} {"current_steps": 37600, "total_steps": 93654, "loss": 0.8541, "learning_rate": 3.309659615852586e-05, "epoch": 1.2044333397398936, "percentage": 40.15, "elapsed_time": "12:52:30", "remaining_time": "19:11:39", "throughput": 6645.44, "total_tokens": 308019200} {"current_steps": 37700, "total_steps": 93654, "loss": 0.8889, "learning_rate": 3.301635160218005e-05, "epoch": 1.2076366198987762, "percentage": 40.25, "elapsed_time": "13:00:32", "remaining_time": "19:18:27", "throughput": 6594.58, "total_tokens": 308838400} {"current_steps": 37800, "total_steps": 93654, "loss": 0.883, "learning_rate": 3.293601488471499e-05, "epoch": 1.210839900057659, "percentage": 40.36, "elapsed_time": "13:08:35", "remaining_time": "19:25:14", "throughput": 6544.52, "total_tokens": 309657600} {"current_steps": 37900, "total_steps": 93654, "loss": 0.9474, "learning_rate": 3.285558692973312e-05, "epoch": 1.2140431802165417, "percentage": 40.47, "elapsed_time": "13:16:40", "remaining_time": "19:31:58", "throughput": 6495.25, "total_tokens": 310476800} {"current_steps": 38000, "total_steps": 93654, "loss": 0.904, "learning_rate": 3.277506866188577e-05, "epoch": 1.2172464603754245, "percentage": 40.57, "elapsed_time": "13:24:43", "remaining_time": "19:38:35", "throughput": 6447.23, "total_tokens": 311296000} {"current_steps": 38100, "total_steps": 93654, "loss": 0.8879, "learning_rate": 3.269446100686261e-05, "epoch": 1.220449740534307, "percentage": 40.68, "elapsed_time": "13:32:56", "remaining_time": "19:45:21", "throughput": 6398.87, "total_tokens": 312115200} {"current_steps": 38200, "total_steps": 93654, "loss": 0.9139, "learning_rate": 3.261376489138092e-05, "epoch": 1.22365302069319, "percentage": 40.79, "elapsed_time": "13:41:01", "remaining_time": "19:51:51", "throughput": 6352.55, "total_tokens": 312934400} {"current_steps": 38300, "total_steps": 93654, "loss": 0.959, "learning_rate": 3.253298124317502e-05, "epoch": 1.2268563008520725, "percentage": 40.9, "elapsed_time": "13:49:06", "remaining_time": "19:58:16", "throughput": 6307.09, "total_tokens": 313753600} {"current_steps": 38400, "total_steps": 93654, "loss": 0.9155, "learning_rate": 3.245211099098551e-05, "epoch": 1.2300595810109551, "percentage": 41.0, "elapsed_time": "13:57:11", "remaining_time": "20:04:38", "throughput": 6262.48, "total_tokens": 314572800} {"current_steps": 38500, "total_steps": 93654, "loss": 0.8758, "learning_rate": 3.237115506454869e-05, "epoch": 1.233262861169838, "percentage": 41.11, "elapsed_time": "14:05:15", "remaining_time": "20:10:53", "throughput": 6218.87, "total_tokens": 315392000} {"current_steps": 38600, "total_steps": 93654, "loss": 0.9116, "learning_rate": 3.2290114394585815e-05, "epoch": 1.2364661413287206, "percentage": 41.22, "elapsed_time": "14:13:20", "remaining_time": "20:17:05", "throughput": 6175.96, "total_tokens": 316211200} {"current_steps": 38700, "total_steps": 93654, "loss": 0.8743, "learning_rate": 3.22089899127924e-05, "epoch": 1.2396694214876034, "percentage": 41.32, "elapsed_time": "14:21:24", "remaining_time": "20:23:11", "throughput": 6133.96, "total_tokens": 317030400} {"current_steps": 38800, "total_steps": 93654, "loss": 0.9507, "learning_rate": 3.212778255182752e-05, "epoch": 1.242872701646486, "percentage": 41.43, "elapsed_time": "14:29:29", "remaining_time": "20:29:14", "throughput": 6092.66, "total_tokens": 317849600} {"current_steps": 38900, "total_steps": 93654, "loss": 0.9114, "learning_rate": 3.2046493245303066e-05, "epoch": 1.2460759818053686, "percentage": 41.54, "elapsed_time": "14:37:34", "remaining_time": "20:35:14", "throughput": 6052.06, "total_tokens": 318668800} {"current_steps": 39000, "total_steps": 93654, "loss": 0.9392, "learning_rate": 3.196512292777305e-05, "epoch": 1.2492792619642514, "percentage": 41.64, "elapsed_time": "14:45:37", "remaining_time": "20:41:06", "throughput": 6012.45, "total_tokens": 319488000} {"current_steps": 39100, "total_steps": 93654, "loss": 0.9277, "learning_rate": 3.1883672534722824e-05, "epoch": 1.252482542123134, "percentage": 41.75, "elapsed_time": "14:53:50", "remaining_time": "20:47:08", "throughput": 5972.43, "total_tokens": 320307200} {"current_steps": 39200, "total_steps": 93654, "loss": 0.8868, "learning_rate": 3.180214300255834e-05, "epoch": 1.2556858222820169, "percentage": 41.86, "elapsed_time": "15:01:54", "remaining_time": "20:52:52", "throughput": 5934.17, "total_tokens": 321126400} {"current_steps": 39300, "total_steps": 93654, "loss": 0.9129, "learning_rate": 3.1720535268595406e-05, "epoch": 1.2588891024408995, "percentage": 41.96, "elapsed_time": "15:09:58", "remaining_time": "20:58:32", "throughput": 5896.63, "total_tokens": 321945600} {"current_steps": 39400, "total_steps": 93654, "loss": 0.9237, "learning_rate": 3.1638850271048845e-05, "epoch": 1.262092382599782, "percentage": 42.07, "elapsed_time": "15:18:01", "remaining_time": "21:04:07", "throughput": 5859.77, "total_tokens": 322764800} {"current_steps": 39500, "total_steps": 93654, "loss": 0.8913, "learning_rate": 3.15570889490218e-05, "epoch": 1.265295662758665, "percentage": 42.18, "elapsed_time": "15:26:04", "remaining_time": "21:09:38", "throughput": 5823.56, "total_tokens": 323584000} {"current_steps": 39600, "total_steps": 93654, "loss": 0.9312, "learning_rate": 3.1475252242494855e-05, "epoch": 1.2684989429175475, "percentage": 42.28, "elapsed_time": "15:34:10", "remaining_time": "21:15:08", "throughput": 5787.7, "total_tokens": 324403200} {"current_steps": 39700, "total_steps": 93654, "loss": 0.8776, "learning_rate": 3.139334109231527e-05, "epoch": 1.2717022230764303, "percentage": 42.39, "elapsed_time": "15:42:14", "remaining_time": "21:20:32", "throughput": 5752.63, "total_tokens": 325222400} {"current_steps": 39800, "total_steps": 93654, "loss": 0.9715, "learning_rate": 3.131135644018617e-05, "epoch": 1.274905503235313, "percentage": 42.5, "elapsed_time": "15:50:20", "remaining_time": "21:25:54", "throughput": 5718.01, "total_tokens": 326041600} {"current_steps": 39900, "total_steps": 93654, "loss": 0.9268, "learning_rate": 3.1229299228655683e-05, "epoch": 1.2781087833941958, "percentage": 42.6, "elapsed_time": "15:58:24", "remaining_time": "21:31:10", "throughput": 5684.1, "total_tokens": 326860800} {"current_steps": 40000, "total_steps": 93654, "loss": 0.9286, "learning_rate": 3.1147170401106154e-05, "epoch": 1.2813120635530784, "percentage": 42.71, "elapsed_time": "16:06:28", "remaining_time": "21:36:22", "throughput": 5650.8, "total_tokens": 327680000} {"current_steps": 40100, "total_steps": 93654, "loss": 0.9317, "learning_rate": 3.106497090174325e-05, "epoch": 1.284515343711961, "percentage": 42.82, "elapsed_time": "16:14:41", "remaining_time": "21:41:43", "throughput": 5617.1, "total_tokens": 328499200} {"current_steps": 40200, "total_steps": 93654, "loss": 0.9152, "learning_rate": 3.098270167558514e-05, "epoch": 1.2877186238708438, "percentage": 42.92, "elapsed_time": "16:22:46", "remaining_time": "21:46:48", "throughput": 5584.81, "total_tokens": 329318400} {"current_steps": 40300, "total_steps": 93654, "loss": 0.9283, "learning_rate": 3.09003636684516e-05, "epoch": 1.2909219040297264, "percentage": 43.03, "elapsed_time": "16:30:52", "remaining_time": "21:51:50", "throughput": 5552.99, "total_tokens": 330137600} {"current_steps": 40400, "total_steps": 93654, "loss": 0.9307, "learning_rate": 3.081795782695317e-05, "epoch": 1.294125184188609, "percentage": 43.14, "elapsed_time": "16:38:56", "remaining_time": "21:56:46", "throughput": 5521.75, "total_tokens": 330956800} {"current_steps": 40500, "total_steps": 93654, "loss": 0.8917, "learning_rate": 3.0735485098480255e-05, "epoch": 1.2973284643474918, "percentage": 43.24, "elapsed_time": "16:46:59", "remaining_time": "22:01:37", "throughput": 5491.19, "total_tokens": 331776000} {"current_steps": 40600, "total_steps": 93654, "loss": 0.9321, "learning_rate": 3.0652946431192244e-05, "epoch": 1.3005317445063747, "percentage": 43.35, "elapsed_time": "16:55:04", "remaining_time": "22:06:27", "throughput": 5460.91, "total_tokens": 332595200} {"current_steps": 40700, "total_steps": 93654, "loss": 0.9211, "learning_rate": 3.057034277400658e-05, "epoch": 1.3037350246652573, "percentage": 43.46, "elapsed_time": "17:03:10", "remaining_time": "22:11:13", "throughput": 5431.07, "total_tokens": 333414400} {"current_steps": 40800, "total_steps": 93654, "loss": 0.913, "learning_rate": 3.048767507658788e-05, "epoch": 1.3069383048241399, "percentage": 43.56, "elapsed_time": "17:11:13", "remaining_time": "22:15:53", "throughput": 5401.88, "total_tokens": 334233600} {"current_steps": 40900, "total_steps": 93654, "loss": 0.9423, "learning_rate": 3.0404944289337034e-05, "epoch": 1.3101415849830227, "percentage": 43.67, "elapsed_time": "17:19:15", "remaining_time": "22:20:28", "throughput": 5373.25, "total_tokens": 335052800} {"current_steps": 41000, "total_steps": 93654, "loss": 0.9409, "learning_rate": 3.0322151363380202e-05, "epoch": 1.3133448651419053, "percentage": 43.78, "elapsed_time": "17:27:22", "remaining_time": "22:25:05", "throughput": 5344.63, "total_tokens": 335872000} {"current_steps": 41100, "total_steps": 93654, "loss": 0.9187, "learning_rate": 3.023929725055798e-05, "epoch": 1.316548145300788, "percentage": 43.88, "elapsed_time": "17:35:36", "remaining_time": "22:29:47", "throughput": 5315.93, "total_tokens": 336691200} {"current_steps": 41200, "total_steps": 93654, "loss": 1.0063, "learning_rate": 3.0156382903414383e-05, "epoch": 1.3197514254596707, "percentage": 43.99, "elapsed_time": "17:43:42", "remaining_time": "22:34:15", "throughput": 5288.27, "total_tokens": 337510400} {"current_steps": 41300, "total_steps": 93654, "loss": 0.8821, "learning_rate": 3.007340927518591e-05, "epoch": 1.3229547056185533, "percentage": 44.1, "elapsed_time": "17:51:45", "remaining_time": "22:38:37", "throughput": 5261.26, "total_tokens": 338329600} {"current_steps": 41400, "total_steps": 93654, "loss": 0.8968, "learning_rate": 2.999037731979063e-05, "epoch": 1.3261579857774362, "percentage": 44.21, "elapsed_time": "17:59:47", "remaining_time": "22:42:53", "throughput": 5234.78, "total_tokens": 339148800} {"current_steps": 41500, "total_steps": 93654, "loss": 0.955, "learning_rate": 2.9907287991817128e-05, "epoch": 1.3293612659363188, "percentage": 44.31, "elapsed_time": "18:07:52", "remaining_time": "22:47:09", "throughput": 5208.47, "total_tokens": 339968000} {"current_steps": 41600, "total_steps": 93654, "loss": 0.9096, "learning_rate": 2.9824142246513624e-05, "epoch": 1.3325645460952016, "percentage": 44.42, "elapsed_time": "18:15:55", "remaining_time": "22:51:20", "throughput": 5182.62, "total_tokens": 340787200} {"current_steps": 41700, "total_steps": 93654, "loss": 0.8828, "learning_rate": 2.9740941039776925e-05, "epoch": 1.3357678262540842, "percentage": 44.53, "elapsed_time": "18:23:58", "remaining_time": "22:55:26", "throughput": 5157.24, "total_tokens": 341606400} {"current_steps": 41800, "total_steps": 93654, "loss": 0.9614, "learning_rate": 2.9657685328141466e-05, "epoch": 1.3389711064129668, "percentage": 44.63, "elapsed_time": "18:32:00", "remaining_time": "22:59:28", "throughput": 5132.22, "total_tokens": 342425600} {"current_steps": 41900, "total_steps": 93654, "loss": 0.8739, "learning_rate": 2.95743760687683e-05, "epoch": 1.3421743865718496, "percentage": 44.74, "elapsed_time": "18:40:04", "remaining_time": "23:03:30", "throughput": 5107.43, "total_tokens": 343244800} {"current_steps": 42000, "total_steps": 93654, "loss": 0.9595, "learning_rate": 2.9491014219434105e-05, "epoch": 1.3453776667307322, "percentage": 44.85, "elapsed_time": "18:48:11", "remaining_time": "23:07:31", "throughput": 5082.81, "total_tokens": 344064000} {"current_steps": 42100, "total_steps": 93654, "loss": 0.9026, "learning_rate": 2.9407600738520162e-05, "epoch": 1.3485809468896148, "percentage": 44.95, "elapsed_time": "18:56:22", "remaining_time": "23:11:33", "throughput": 5058.22, "total_tokens": 344883200} {"current_steps": 42200, "total_steps": 93654, "loss": 0.9488, "learning_rate": 2.9324136585001348e-05, "epoch": 1.3517842270484977, "percentage": 45.06, "elapsed_time": "19:04:24", "remaining_time": "23:15:21", "throughput": 5034.68, "total_tokens": 345702400} {"current_steps": 42300, "total_steps": 93654, "loss": 0.9433, "learning_rate": 2.9240622718435107e-05, "epoch": 1.3549875072073805, "percentage": 45.17, "elapsed_time": "19:12:27", "remaining_time": "23:19:08", "throughput": 5011.31, "total_tokens": 346521600} {"current_steps": 42400, "total_steps": 93654, "loss": 0.8783, "learning_rate": 2.9157060098950395e-05, "epoch": 1.358190787366263, "percentage": 45.27, "elapsed_time": "19:20:30", "remaining_time": "23:22:50", "throughput": 4988.36, "total_tokens": 347340800} {"current_steps": 42500, "total_steps": 93654, "loss": 0.8925, "learning_rate": 2.9073449687236688e-05, "epoch": 1.3613940675251457, "percentage": 45.38, "elapsed_time": "19:31:01", "remaining_time": "23:29:28", "throughput": 4955.21, "total_tokens": 348160000} {"current_steps": 42600, "total_steps": 93654, "loss": 0.9417, "learning_rate": 2.8989792444532892e-05, "epoch": 1.3645973476840285, "percentage": 45.49, "elapsed_time": "19:41:17", "remaining_time": "23:35:43", "throughput": 4923.68, "total_tokens": 348979200} {"current_steps": 42700, "total_steps": 93654, "loss": 0.9262, "learning_rate": 2.890608933261633e-05, "epoch": 1.3678006278429111, "percentage": 45.59, "elapsed_time": "19:52:52", "remaining_time": "23:43:27", "throughput": 4887.33, "total_tokens": 349798400} {"current_steps": 42800, "total_steps": 93654, "loss": 0.9022, "learning_rate": 2.882234131379167e-05, "epoch": 1.3710039080017937, "percentage": 45.7, "elapsed_time": "20:03:57", "remaining_time": "23:50:31", "throughput": 4853.65, "total_tokens": 350617600} {"current_steps": 42900, "total_steps": 93654, "loss": 0.9306, "learning_rate": 2.8738549350879824e-05, "epoch": 1.3742071881606766, "percentage": 45.81, "elapsed_time": "20:15:26", "remaining_time": "23:57:57", "throughput": 4819.05, "total_tokens": 351436800} {"current_steps": 43000, "total_steps": 93654, "loss": 0.8878, "learning_rate": 2.8654714407206956e-05, "epoch": 1.3774104683195592, "percentage": 45.91, "elapsed_time": "20:27:09", "remaining_time": "1 day, 0:05:35", "throughput": 4784.19, "total_tokens": 352256000} {"current_steps": 43100, "total_steps": 93654, "loss": 0.939, "learning_rate": 2.8570837446593336e-05, "epoch": 1.380613748478442, "percentage": 46.02, "elapsed_time": "20:38:13", "remaining_time": "1 day, 0:12:22", "throughput": 4752.44, "total_tokens": 353075200} {"current_steps": 43200, "total_steps": 93654, "loss": 0.9062, "learning_rate": 2.8486919433342295e-05, "epoch": 1.3838170286373246, "percentage": 46.13, "elapsed_time": "20:48:20", "remaining_time": "1 day, 0:17:57", "throughput": 4724.85, "total_tokens": 353894400} {"current_steps": 43300, "total_steps": 93654, "loss": 0.8853, "learning_rate": 2.8402961332229143e-05, "epoch": 1.3870203087962074, "percentage": 46.23, "elapsed_time": "20:59:18", "remaining_time": "1 day, 0:24:28", "throughput": 4694.53, "total_tokens": 354713600} {"current_steps": 43400, "total_steps": 93654, "loss": 0.8932, "learning_rate": 2.831896410849005e-05, "epoch": 1.39022358895509, "percentage": 46.34, "elapsed_time": "21:14:42", "remaining_time": "1 day, 0:36:01", "throughput": 4648.54, "total_tokens": 355532800} {"current_steps": 43500, "total_steps": 93654, "loss": 0.9169, "learning_rate": 2.823492872781098e-05, "epoch": 1.3934268691139726, "percentage": 46.45, "elapsed_time": "21:24:50", "remaining_time": "1 day, 0:41:22", "throughput": 4622.51, "total_tokens": 356352000} {"current_steps": 43600, "total_steps": 93654, "loss": 0.9475, "learning_rate": 2.815085615631654e-05, "epoch": 1.3966301492728554, "percentage": 46.55, "elapsed_time": "21:33:58", "remaining_time": "1 day, 0:45:31", "throughput": 4600.42, "total_tokens": 357171200} {"current_steps": 43100, "total_steps": 93654, "loss": 0.9391, "learning_rate": 2.8570837446593336e-05, "epoch": 1.380613748478442, "percentage": 46.02, "elapsed_time": "0:07:41", "remaining_time": "0:09:01", "throughput": 765064.56, "total_tokens": 353075200} {"current_steps": 43200, "total_steps": 93654, "loss": 0.9061, "learning_rate": 2.8486919433342295e-05, "epoch": 1.3838170286373246, "percentage": 46.13, "elapsed_time": "0:15:12", "remaining_time": "0:17:45", "throughput": 387924.82, "total_tokens": 353894400} {"current_steps": 43300, "total_steps": 93654, "loss": 0.8854, "learning_rate": 2.8402961332229143e-05, "epoch": 1.3870203087962074, "percentage": 46.23, "elapsed_time": "0:22:41", "remaining_time": "0:26:23", "throughput": 260550.13, "total_tokens": 354713600} {"current_steps": 43400, "total_steps": 93654, "loss": 0.893, "learning_rate": 2.831896410849005e-05, "epoch": 1.39022358895509, "percentage": 46.34, "elapsed_time": "0:30:14", "remaining_time": "0:35:00", "throughput": 195990.27, "total_tokens": 355532800} {"current_steps": 43500, "total_steps": 93654, "loss": 0.9166, "learning_rate": 2.823492872781098e-05, "epoch": 1.3934268691139726, "percentage": 46.45, "elapsed_time": "0:37:46", "remaining_time": "0:43:33", "throughput": 157213.91, "total_tokens": 356352000} {"current_steps": 43600, "total_steps": 93654, "loss": 0.9473, "learning_rate": 2.815085615631654e-05, "epoch": 1.3966301492728554, "percentage": 46.55, "elapsed_time": "0:45:20", "remaining_time": "0:52:02", "throughput": 131310.39, "total_tokens": 357171200} {"current_steps": 43700, "total_steps": 93654, "loss": 0.9046, "learning_rate": 2.8066747360558966e-05, "epoch": 1.399833429431738, "percentage": 46.66, "elapsed_time": "0:52:52", "remaining_time": "1:00:26", "throughput": 112836.33, "total_tokens": 357990400} {"current_steps": 43800, "total_steps": 93654, "loss": 0.9325, "learning_rate": 2.798260330750689e-05, "epoch": 1.4030367095906209, "percentage": 46.77, "elapsed_time": "1:00:24", "remaining_time": "1:08:45", "throughput": 98985.35, "total_tokens": 358809600} {"current_steps": 43900, "total_steps": 93654, "loss": 0.9057, "learning_rate": 2.789842496453432e-05, "epoch": 1.4062399897495035, "percentage": 46.87, "elapsed_time": "1:07:56", "remaining_time": "1:17:00", "throughput": 88212.72, "total_tokens": 359628800} {"current_steps": 44000, "total_steps": 93654, "loss": 0.923, "learning_rate": 2.7814213299409475e-05, "epoch": 1.4094432699083863, "percentage": 46.98, "elapsed_time": "1:15:26", "remaining_time": "1:25:08", "throughput": 79626.29, "total_tokens": 360448000} {"current_steps": 44100, "total_steps": 93654, "loss": 0.8764, "learning_rate": 2.7729969280283662e-05, "epoch": 1.412646550067269, "percentage": 47.09, "elapsed_time": "1:23:22", "remaining_time": "1:33:40", "throughput": 72221.19, "total_tokens": 361267200} {"current_steps": 44200, "total_steps": 93654, "loss": 0.9295, "learning_rate": 2.7645693875680163e-05, "epoch": 1.4158498302261515, "percentage": 47.19, "elapsed_time": "1:30:54", "remaining_time": "1:41:42", "throughput": 66384.96, "total_tokens": 362086400} {"current_steps": 44300, "total_steps": 93654, "loss": 0.8883, "learning_rate": 2.7561388054483074e-05, "epoch": 1.4190531103850343, "percentage": 47.3, "elapsed_time": "1:38:28", "remaining_time": "1:49:43", "throughput": 61416.44, "total_tokens": 362905600} {"current_steps": 44400, "total_steps": 93654, "loss": 0.8784, "learning_rate": 2.7477052785926178e-05, "epoch": 1.422256390543917, "percentage": 47.41, "elapsed_time": "1:46:01", "remaining_time": "1:57:36", "throughput": 57179.79, "total_tokens": 363724800} {"current_steps": 44500, "total_steps": 93654, "loss": 0.949, "learning_rate": 2.7392689039581815e-05, "epoch": 1.4254596707027996, "percentage": 47.52, "elapsed_time": "1:53:35", "remaining_time": "2:05:28", "throughput": 53489.2, "total_tokens": 364544000} {"current_steps": 44600, "total_steps": 93654, "loss": 0.8738, "learning_rate": 2.7308297785349724e-05, "epoch": 1.4286629508616824, "percentage": 47.62, "elapsed_time": "2:01:06", "remaining_time": "2:13:11", "throughput": 50283.25, "total_tokens": 365363200} {"current_steps": 44700, "total_steps": 93654, "loss": 0.9074, "learning_rate": 2.7223879993445873e-05, "epoch": 1.431866231020565, "percentage": 47.73, "elapsed_time": "2:08:37", "remaining_time": "2:20:51", "throughput": 47448.1, "total_tokens": 366182400} {"current_steps": 44800, "total_steps": 93654, "loss": 0.953, "learning_rate": 2.713943663439135e-05, "epoch": 1.4350695111794478, "percentage": 47.84, "elapsed_time": "2:16:11", "remaining_time": "2:28:30", "throughput": 44914.46, "total_tokens": 367001600} {"current_steps": 44900, "total_steps": 93654, "loss": 0.8736, "learning_rate": 2.7054968679001174e-05, "epoch": 1.4382727913383304, "percentage": 47.94, "elapsed_time": "2:23:43", "remaining_time": "2:36:03", "throughput": 42654.04, "total_tokens": 367820800} {"current_steps": 45000, "total_steps": 93654, "loss": 0.8405, "learning_rate": 2.697047709837312e-05, "epoch": 1.4414760714972132, "percentage": 48.05, "elapsed_time": "2:31:14", "remaining_time": "2:43:31", "throughput": 40623.25, "total_tokens": 368640000} {"current_steps": 45100, "total_steps": 93654, "loss": 0.8852, "learning_rate": 2.6885962863876596e-05, "epoch": 1.4446793516560958, "percentage": 48.16, "elapsed_time": "2:39:14", "remaining_time": "2:51:25", "throughput": 38669.99, "total_tokens": 369459200} {"current_steps": 45200, "total_steps": 93654, "loss": 0.9029, "learning_rate": 2.6801426947141435e-05, "epoch": 1.4478826318149784, "percentage": 48.26, "elapsed_time": "2:46:48", "remaining_time": "2:58:48", "throughput": 36998.13, "total_tokens": 370278400} {"current_steps": 45300, "total_steps": 93654, "loss": 0.8751, "learning_rate": 2.671687032004676e-05, "epoch": 1.4510859119738613, "percentage": 48.37, "elapsed_time": "2:54:20", "remaining_time": "3:06:05", "throughput": 35476.65, "total_tokens": 371097600} {"current_steps": 45400, "total_steps": 93654, "loss": 0.9417, "learning_rate": 2.6632293954709785e-05, "epoch": 1.4542891921327439, "percentage": 48.48, "elapsed_time": "3:01:54", "remaining_time": "3:13:20", "throughput": 34076.4, "total_tokens": 371916800} {"current_steps": 45500, "total_steps": 93654, "loss": 0.9022, "learning_rate": 2.654769882347464e-05, "epoch": 1.4574924722916267, "percentage": 48.58, "elapsed_time": "3:09:25", "remaining_time": "3:20:28", "throughput": 32796.3, "total_tokens": 372736000} {"current_steps": 45600, "total_steps": 93654, "loss": 0.9017, "learning_rate": 2.646308589890123e-05, "epoch": 1.4606957524505093, "percentage": 48.69, "elapsed_time": "3:16:57", "remaining_time": "3:27:33", "throughput": 31611.24, "total_tokens": 373555200} {"current_steps": 45700, "total_steps": 93654, "loss": 0.883, "learning_rate": 2.637845615375397e-05, "epoch": 1.4638990326093921, "percentage": 48.8, "elapsed_time": "3:24:28", "remaining_time": "3:34:33", "throughput": 30515.65, "total_tokens": 374374400} {"current_steps": 45800, "total_steps": 93654, "loss": 0.9469, "learning_rate": 2.629381056099071e-05, "epoch": 1.4671023127682747, "percentage": 48.9, "elapsed_time": "3:32:02", "remaining_time": "3:41:33", "throughput": 29489.78, "total_tokens": 375193600} {"current_steps": 45900, "total_steps": 93654, "loss": 0.885, "learning_rate": 2.6209150093751473e-05, "epoch": 1.4703055929271573, "percentage": 49.01, "elapsed_time": "3:43:25", "remaining_time": "3:52:27", "throughput": 28049.01, "total_tokens": 376012800} {"current_steps": 46000, "total_steps": 93654, "loss": 0.9248, "learning_rate": 2.612447572534727e-05, "epoch": 1.4735088730860402, "percentage": 49.12, "elapsed_time": "4:00:11", "remaining_time": "4:08:49", "throughput": 26147.62, "total_tokens": 376832000} {"current_steps": 46100, "total_steps": 93654, "loss": 0.9041, "learning_rate": 2.6039788429248957e-05, "epoch": 1.4767121532449228, "percentage": 49.22, "elapsed_time": "4:17:23", "remaining_time": "4:25:30", "throughput": 24453.34, "total_tokens": 377651200} {"current_steps": 46200, "total_steps": 93654, "loss": 0.9431, "learning_rate": 2.5955089179075997e-05, "epoch": 1.4799154334038054, "percentage": 49.33, "elapsed_time": "4:34:13", "remaining_time": "4:41:40", "throughput": 23001.95, "total_tokens": 378470400} {"current_steps": 46300, "total_steps": 93654, "loss": 0.8893, "learning_rate": 2.5870378948585295e-05, "epoch": 1.4831187135626882, "percentage": 49.44, "elapsed_time": "4:50:56", "remaining_time": "4:57:34", "throughput": 21727.3, "total_tokens": 379289600} {"current_steps": 46400, "total_steps": 93654, "loss": 0.9181, "learning_rate": 2.5785658711659987e-05, "epoch": 1.4863219937215708, "percentage": 49.54, "elapsed_time": "5:07:44", "remaining_time": "5:13:23", "throughput": 20586.43, "total_tokens": 380108800} {"current_steps": 46500, "total_steps": 93654, "loss": 0.8921, "learning_rate": 2.570092944229826e-05, "epoch": 1.4895252738804536, "percentage": 49.65, "elapsed_time": "5:23:06", "remaining_time": "5:27:39", "throughput": 19648.86, "total_tokens": 380928000} {"current_steps": 46600, "total_steps": 93654, "loss": 0.8693, "learning_rate": 2.5616192114602127e-05, "epoch": 1.4927285540393362, "percentage": 49.76, "elapsed_time": "5:31:55", "remaining_time": "5:35:10", "throughput": 19167.88, "total_tokens": 381747200} {"current_steps": 46700, "total_steps": 93654, "loss": 0.9397, "learning_rate": 2.5531447702766254e-05, "epoch": 1.495931834198219, "percentage": 49.86, "elapsed_time": "5:40:45", "remaining_time": "5:42:36", "throughput": 18711.7, "total_tokens": 382566400} {"current_steps": 46800, "total_steps": 93654, "loss": 0.8526, "learning_rate": 2.5446697181066747e-05, "epoch": 1.4991351143571017, "percentage": 49.97, "elapsed_time": "5:49:34", "remaining_time": "5:49:59", "throughput": 18278.37, "total_tokens": 383385600} {"current_steps": 46900, "total_steps": 93654, "loss": 0.9122, "learning_rate": 2.536194152384997e-05, "epoch": 1.5023383945159843, "percentage": 50.08, "elapsed_time": "5:58:25", "remaining_time": "5:57:18", "throughput": 17865.43, "total_tokens": 384204800} {"current_steps": 47000, "total_steps": 93654, "loss": 0.8666, "learning_rate": 2.527718170552129e-05, "epoch": 1.505541674674867, "percentage": 50.18, "elapsed_time": "6:07:14", "remaining_time": "6:04:32", "throughput": 17473.56, "total_tokens": 385024000} {"current_steps": 47100, "total_steps": 93654, "loss": 0.911, "learning_rate": 2.519241870053396e-05, "epoch": 1.5087449548337497, "percentage": 50.29, "elapsed_time": "6:16:18", "remaining_time": "6:11:57", "throughput": 17088.69, "total_tokens": 385843200} {"current_steps": 47200, "total_steps": 93654, "loss": 0.974, "learning_rate": 2.5107653483377852e-05, "epoch": 1.5119482349926323, "percentage": 50.4, "elapsed_time": "6:25:10", "remaining_time": "6:19:05", "throughput": 16730.89, "total_tokens": 386662400} {"current_steps": 47300, "total_steps": 93654, "loss": 0.8986, "learning_rate": 2.502288702856824e-05, "epoch": 1.5151515151515151, "percentage": 50.51, "elapsed_time": "6:34:01", "remaining_time": "6:26:08", "throughput": 16389.72, "total_tokens": 387481600} {"current_steps": 47400, "total_steps": 93654, "loss": 0.8549, "learning_rate": 2.4938120310634682e-05, "epoch": 1.518354795310398, "percentage": 50.61, "elapsed_time": "6:42:49", "remaining_time": "6:33:05", "throughput": 16065.53, "total_tokens": 388300800} {"current_steps": 47500, "total_steps": 93654, "loss": 0.899, "learning_rate": 2.485335430410972e-05, "epoch": 1.5215580754692806, "percentage": 50.72, "elapsed_time": "6:51:39", "remaining_time": "6:39:59", "throughput": 15754.27, "total_tokens": 389120000} {"current_steps": 47600, "total_steps": 93654, "loss": 0.8622, "learning_rate": 2.4768589983517716e-05, "epoch": 1.5247613556281632, "percentage": 50.83, "elapsed_time": "7:00:28", "remaining_time": "6:46:49", "throughput": 15456.1, "total_tokens": 389939200} {"current_steps": 47700, "total_steps": 93654, "loss": 0.8334, "learning_rate": 2.4683828323363687e-05, "epoch": 1.527964635787046, "percentage": 50.93, "elapsed_time": "7:09:17", "remaining_time": "6:53:34", "throughput": 15170.66, "total_tokens": 390758400} {"current_steps": 47800, "total_steps": 93654, "loss": 0.9028, "learning_rate": 2.459907029812203e-05, "epoch": 1.5311679159459286, "percentage": 51.04, "elapsed_time": "7:18:08", "remaining_time": "7:00:18", "throughput": 14895.55, "total_tokens": 391577600} {"current_steps": 47900, "total_steps": 93654, "loss": 0.9259, "learning_rate": 2.4514316882225347e-05, "epoch": 1.5343711961048112, "percentage": 51.15, "elapsed_time": "7:27:01", "remaining_time": "7:06:59", "throughput": 14629.98, "total_tokens": 392396800} {"current_steps": 48000, "total_steps": 93654, "loss": 0.8639, "learning_rate": 2.442956905005328e-05, "epoch": 1.537574476263694, "percentage": 51.25, "elapsed_time": "7:35:51", "remaining_time": "7:13:35", "throughput": 14376.22, "total_tokens": 393216000} {"current_steps": 48100, "total_steps": 93654, "loss": 0.8828, "learning_rate": 2.434482777592125e-05, "epoch": 1.5407777564225769, "percentage": 51.36, "elapsed_time": "7:44:55", "remaining_time": "7:20:18", "throughput": 14125.5, "total_tokens": 394035200} {"current_steps": 48200, "total_steps": 93654, "loss": 0.8802, "learning_rate": 2.426009403406931e-05, "epoch": 1.5439810365814595, "percentage": 51.47, "elapsed_time": "7:53:45", "remaining_time": "7:26:46", "throughput": 13890.87, "total_tokens": 394854400} {"current_steps": 48300, "total_steps": 93654, "loss": 0.8811, "learning_rate": 2.4175368798650884e-05, "epoch": 1.547184316740342, "percentage": 51.57, "elapsed_time": "8:02:35", "remaining_time": "7:33:09", "throughput": 13664.71, "total_tokens": 395673600} {"current_steps": 48400, "total_steps": 93654, "loss": 0.8663, "learning_rate": 2.4090653043721612e-05, "epoch": 1.550387596899225, "percentage": 51.68, "elapsed_time": "8:11:24", "remaining_time": "7:39:27", "throughput": 13447.57, "total_tokens": 396492800} {"current_steps": 48500, "total_steps": 93654, "loss": 0.9452, "learning_rate": 2.4005947743228157e-05, "epoch": 1.5535908770581075, "percentage": 51.79, "elapsed_time": "8:20:14", "remaining_time": "7:45:43", "throughput": 13237.4, "total_tokens": 397312000} {"current_steps": 48600, "total_steps": 93654, "loss": 0.8968, "learning_rate": 2.3921253870996972e-05, "epoch": 1.55679415721699, "percentage": 51.89, "elapsed_time": "8:29:04", "remaining_time": "7:51:56", "throughput": 13034.34, "total_tokens": 398131200} {"current_steps": 48700, "total_steps": 93654, "loss": 0.9475, "learning_rate": 2.383657240072314e-05, "epoch": 1.559997437375873, "percentage": 52.0, "elapsed_time": "8:37:55", "remaining_time": "7:58:05", "throughput": 12838.04, "total_tokens": 398950400} {"current_steps": 48800, "total_steps": 93654, "loss": 0.9347, "learning_rate": 2.375190430595914e-05, "epoch": 1.5632007175347555, "percentage": 52.11, "elapsed_time": "8:46:48", "remaining_time": "8:04:12", "throughput": 12647.55, "total_tokens": 399769600} {"current_steps": 48900, "total_steps": 93654, "loss": 0.8969, "learning_rate": 2.366725056010369e-05, "epoch": 1.5664039976936381, "percentage": 52.21, "elapsed_time": "8:55:38", "remaining_time": "8:10:13", "throughput": 12464.44, "total_tokens": 400588800} {"current_steps": 49000, "total_steps": 93654, "loss": 0.8926, "learning_rate": 2.3582612136390556e-05, "epoch": 1.569607277852521, "percentage": 52.32, "elapsed_time": "9:04:30", "remaining_time": "8:16:12", "throughput": 12286.59, "total_tokens": 401408000} {"current_steps": 49100, "total_steps": 93654, "loss": 0.9027, "learning_rate": 2.349799000787733e-05, "epoch": 1.5728105580114038, "percentage": 52.43, "elapsed_time": "9:13:21", "remaining_time": "8:22:07", "throughput": 12114.71, "total_tokens": 402227200} {"current_steps": 49200, "total_steps": 93654, "loss": 0.8651, "learning_rate": 2.3413385147434285e-05, "epoch": 1.5760138381702864, "percentage": 52.53, "elapsed_time": "9:22:11", "remaining_time": "8:27:57", "throughput": 11948.61, "total_tokens": 403046400} {"current_steps": 49300, "total_steps": 93654, "loss": 0.8354, "learning_rate": 2.332879852773314e-05, "epoch": 1.579217118329169, "percentage": 52.64, "elapsed_time": "9:31:00", "remaining_time": "8:33:43", "throughput": 11787.92, "total_tokens": 403865600} {"current_steps": 49400, "total_steps": 93654, "loss": 0.903, "learning_rate": 2.3244231121235936e-05, "epoch": 1.5824203984880518, "percentage": 52.75, "elapsed_time": "9:39:52", "remaining_time": "8:39:28", "throughput": 11631.23, "total_tokens": 404684800} {"current_steps": 49500, "total_steps": 93654, "loss": 0.9085, "learning_rate": 2.3159683900183812e-05, "epoch": 1.5856236786469344, "percentage": 52.85, "elapsed_time": "9:48:41", "remaining_time": "8:45:07", "throughput": 11480.29, "total_tokens": 405504000} {"current_steps": 49600, "total_steps": 93654, "loss": 0.9002, "learning_rate": 2.3075157836585854e-05, "epoch": 1.588826958805817, "percentage": 52.96, "elapsed_time": "9:57:28", "remaining_time": "8:50:40", "throughput": 11334.3, "total_tokens": 406323200} {"current_steps": 49700, "total_steps": 93654, "loss": 0.8665, "learning_rate": 2.2990653902207875e-05, "epoch": 1.5920302389646999, "percentage": 53.07, "elapsed_time": "10:06:18", "remaining_time": "8:56:12", "throughput": 11191.97, "total_tokens": 407142400} {"current_steps": 49800, "total_steps": 93654, "loss": 0.9031, "learning_rate": 2.2906173068561324e-05, "epoch": 1.5952335191235827, "percentage": 53.17, "elapsed_time": "10:15:09", "remaining_time": "9:01:42", "throughput": 11053.08, "total_tokens": 407961600} {"current_steps": 49900, "total_steps": 93654, "loss": 0.9153, "learning_rate": 2.282171630689203e-05, "epoch": 1.5984367992824653, "percentage": 53.28, "elapsed_time": "10:24:01", "remaining_time": "9:07:09", "throughput": 10917.9, "total_tokens": 408780800} {"current_steps": 50000, "total_steps": 93654, "loss": 0.8904, "learning_rate": 2.2737284588169107e-05, "epoch": 1.601640079441348, "percentage": 53.39, "elapsed_time": "10:32:51", "remaining_time": "9:12:31", "throughput": 10787.16, "total_tokens": 409600000} {"current_steps": 50100, "total_steps": 93654, "loss": 0.8847, "learning_rate": 2.2652878883073736e-05, "epoch": 1.6048433596002307, "percentage": 53.49, "elapsed_time": "10:42:42", "remaining_time": "9:18:44", "throughput": 10642.9, "total_tokens": 410419200} {"current_steps": 50200, "total_steps": 93654, "loss": 0.8983, "learning_rate": 2.2568500161988023e-05, "epoch": 1.6080466397591133, "percentage": 53.6, "elapsed_time": "10:52:13", "remaining_time": "9:24:34", "throughput": 10508.73, "total_tokens": 411238400} {"current_steps": 50300, "total_steps": 93654, "loss": 0.9138, "learning_rate": 2.2484149394983882e-05, "epoch": 1.611249919917996, "percentage": 53.71, "elapsed_time": "11:01:36", "remaining_time": "9:30:15", "throughput": 10380.1, "total_tokens": 412057600} {"current_steps": 50400, "total_steps": 93654, "loss": 0.8536, "learning_rate": 2.239982755181181e-05, "epoch": 1.6144532000768788, "percentage": 53.82, "elapsed_time": "11:11:27", "remaining_time": "9:36:15", "throughput": 10248.27, "total_tokens": 412876800} {"current_steps": 50500, "total_steps": 93654, "loss": 0.9137, "learning_rate": 2.2315535601889814e-05, "epoch": 1.6176564802357616, "percentage": 53.92, "elapsed_time": "11:22:47", "remaining_time": "9:43:28", "throughput": 10098.19, "total_tokens": 413696000} {"current_steps": 50600, "total_steps": 93654, "loss": 0.8992, "learning_rate": 2.2231274514292196e-05, "epoch": 1.620859760394644, "percentage": 54.03, "elapsed_time": "11:31:15", "remaining_time": "9:48:10", "throughput": 9994.19, "total_tokens": 414515200} {"current_steps": 50700, "total_steps": 93654, "loss": 0.9211, "learning_rate": 2.214704525773846e-05, "epoch": 1.6240630405535268, "percentage": 54.14, "elapsed_time": "11:39:35", "remaining_time": "9:52:42", "throughput": 9894.69, "total_tokens": 415334400} {"current_steps": 50800, "total_steps": 93654, "loss": 0.9231, "learning_rate": 2.2062848800582168e-05, "epoch": 1.6272663207124096, "percentage": 54.24, "elapsed_time": "11:49:04", "remaining_time": "9:58:09", "throughput": 9781.7, "total_tokens": 416153600} {"current_steps": 50900, "total_steps": 93654, "loss": 0.8579, "learning_rate": 2.197868611079978e-05, "epoch": 1.6304696008712922, "percentage": 54.35, "elapsed_time": "11:57:56", "remaining_time": "10:03:02", "throughput": 9679.87, "total_tokens": 416972800} {"current_steps": 51000, "total_steps": 93654, "loss": 0.8802, "learning_rate": 2.189455815597957e-05, "epoch": 1.6336728810301748, "percentage": 54.46, "elapsed_time": "12:06:50", "remaining_time": "10:07:53", "throughput": 9580.15, "total_tokens": 417792000} {"current_steps": 51100, "total_steps": 93654, "loss": 0.897, "learning_rate": 2.1810465903310445e-05, "epoch": 1.6368761611890577, "percentage": 54.56, "elapsed_time": "12:14:58", "remaining_time": "10:12:03", "throughput": 9492.56, "total_tokens": 418611200} {"current_steps": 51200, "total_steps": 93654, "loss": 0.9145, "learning_rate": 2.1726410319570874e-05, "epoch": 1.6400794413479403, "percentage": 54.67, "elapsed_time": "12:22:58", "remaining_time": "10:16:03", "throughput": 9408.89, "total_tokens": 419430400} {"current_steps": 51300, "total_steps": 93654, "loss": 0.9656, "learning_rate": 2.164239237111776e-05, "epoch": 1.6432827215068229, "percentage": 54.78, "elapsed_time": "12:31:28", "remaining_time": "10:20:25", "throughput": 9320.55, "total_tokens": 420249600} {"current_steps": 51400, "total_steps": 93654, "loss": 0.8937, "learning_rate": 2.1558413023875334e-05, "epoch": 1.6464860016657057, "percentage": 54.88, "elapsed_time": "12:39:42", "remaining_time": "10:24:31", "throughput": 9237.43, "total_tokens": 421068800} {"current_steps": 51500, "total_steps": 93654, "loss": 0.8966, "learning_rate": 2.147447324332403e-05, "epoch": 1.6496892818245885, "percentage": 54.99, "elapsed_time": "12:47:44", "remaining_time": "10:28:24", "throughput": 9158.72, "total_tokens": 421888000} {"current_steps": 51600, "total_steps": 93654, "loss": 0.9922, "learning_rate": 2.1390573994489377e-05, "epoch": 1.6528925619834711, "percentage": 55.1, "elapsed_time": "12:55:56", "remaining_time": "10:32:23", "throughput": 9079.5, "total_tokens": 422707200} {"current_steps": 51700, "total_steps": 93654, "loss": 0.9201, "learning_rate": 2.1306716241930968e-05, "epoch": 1.6560958421423537, "percentage": 55.2, "elapsed_time": "13:04:08", "remaining_time": "10:36:19", "throughput": 9001.99, "total_tokens": 423526400} {"current_steps": 51800, "total_steps": 93654, "loss": 0.9039, "learning_rate": 2.1222900949731297e-05, "epoch": 1.6592991223012366, "percentage": 55.31, "elapsed_time": "13:12:29", "remaining_time": "10:40:19", "throughput": 8924.24, "total_tokens": 424345600} {"current_steps": 51900, "total_steps": 93654, "loss": 0.968, "learning_rate": 2.1139129081484734e-05, "epoch": 1.6625024024601192, "percentage": 55.42, "elapsed_time": "13:23:03", "remaining_time": "10:46:04", "throughput": 8823.78, "total_tokens": 425164800} {"current_steps": 52000, "total_steps": 93654, "loss": 0.9064, "learning_rate": 2.1055401600286386e-05, "epoch": 1.6657056826190018, "percentage": 55.52, "elapsed_time": "13:31:29", "remaining_time": "10:50:02", "throughput": 8748.95, "total_tokens": 425984000} {"current_steps": 52100, "total_steps": 93654, "loss": 0.8786, "learning_rate": 2.0971719468721077e-05, "epoch": 1.6689089627778846, "percentage": 55.63, "elapsed_time": "13:40:07", "remaining_time": "10:54:06", "throughput": 8673.54, "total_tokens": 426803200} {"current_steps": 52200, "total_steps": 93654, "loss": 0.9213, "learning_rate": 2.0888083648852267e-05, "epoch": 1.6721122429367674, "percentage": 55.74, "elapsed_time": "13:47:54", "remaining_time": "10:57:28", "throughput": 8608.43, "total_tokens": 427622400} {"current_steps": 52300, "total_steps": 93654, "loss": 0.944, "learning_rate": 2.0804495102210975e-05, "epoch": 1.6753155230956498, "percentage": 55.84, "elapsed_time": "13:56:47", "remaining_time": "11:01:39", "throughput": 8533.38, "total_tokens": 428441600} {"current_steps": 52400, "total_steps": 93654, "loss": 0.8767, "learning_rate": 2.0720954789784753e-05, "epoch": 1.6785188032545326, "percentage": 55.95, "elapsed_time": "14:05:28", "remaining_time": "11:05:38", "throughput": 8461.9, "total_tokens": 429260800} {"current_steps": 52500, "total_steps": 93654, "loss": 0.9095, "learning_rate": 2.0637463672006595e-05, "epoch": 1.6817220834134154, "percentage": 56.06, "elapsed_time": "14:13:21", "remaining_time": "11:08:55", "throughput": 8399.82, "total_tokens": 430080000} {"current_steps": 52600, "total_steps": 93654, "loss": 0.8976, "learning_rate": 2.0554022708743943e-05, "epoch": 1.684925363572298, "percentage": 56.16, "elapsed_time": "14:21:21", "remaining_time": "11:12:17", "throughput": 8337.57, "total_tokens": 430899200} {"current_steps": 52700, "total_steps": 93654, "loss": 0.9377, "learning_rate": 2.0470632859287628e-05, "epoch": 1.6881286437311807, "percentage": 56.27, "elapsed_time": "14:29:49", "remaining_time": "11:15:57", "throughput": 8272.09, "total_tokens": 431718400} {"current_steps": 52800, "total_steps": 93654, "loss": 0.8911, "learning_rate": 2.0387295082340835e-05, "epoch": 1.6913319238900635, "percentage": 56.38, "elapsed_time": "14:38:59", "remaining_time": "11:20:07", "throughput": 8201.37, "total_tokens": 432537600} {"current_steps": 52900, "total_steps": 93654, "loss": 0.8771, "learning_rate": 2.0304010336008112e-05, "epoch": 1.694535204048946, "percentage": 56.48, "elapsed_time": "14:47:15", "remaining_time": "11:23:32", "throughput": 8140.3, "total_tokens": 433356800} {"current_steps": 53000, "total_steps": 93654, "loss": 0.9529, "learning_rate": 2.0220779577784298e-05, "epoch": 1.6977384842078287, "percentage": 56.59, "elapsed_time": "14:56:00", "remaining_time": "11:27:17", "throughput": 8076.15, "total_tokens": 434176000} {"current_steps": 53100, "total_steps": 93654, "loss": 0.8813, "learning_rate": 2.0137603764543573e-05, "epoch": 1.7009417643667115, "percentage": 56.7, "elapsed_time": "15:04:41", "remaining_time": "11:30:56", "throughput": 8013.64, "total_tokens": 434995200} {"current_steps": 53200, "total_steps": 93654, "loss": 0.8268, "learning_rate": 2.0054483852528435e-05, "epoch": 1.7041450445255943, "percentage": 56.8, "elapsed_time": "15:13:01", "remaining_time": "11:34:16", "throughput": 7955.48, "total_tokens": 435814400} {"current_steps": 53300, "total_steps": 93654, "loss": 0.9116, "learning_rate": 1.9971420797338708e-05, "epoch": 1.707348324684477, "percentage": 56.91, "elapsed_time": "15:20:57", "remaining_time": "11:37:15", "throughput": 7901.83, "total_tokens": 436633600} {"current_steps": 53400, "total_steps": 93654, "loss": 0.8564, "learning_rate": 1.9888415553920525e-05, "epoch": 1.7105516048433596, "percentage": 57.02, "elapsed_time": "15:28:41", "remaining_time": "11:40:03", "throughput": 7850.77, "total_tokens": 437452800} {"current_steps": 53500, "total_steps": 93654, "loss": 0.8656, "learning_rate": 1.9805469076555418e-05, "epoch": 1.7137548850022424, "percentage": 57.13, "elapsed_time": "15:36:33", "remaining_time": "11:42:55", "throughput": 7799.32, "total_tokens": 438272000} {"current_steps": 53600, "total_steps": 93654, "loss": 0.8819, "learning_rate": 1.9722582318849274e-05, "epoch": 1.716958165161125, "percentage": 57.23, "elapsed_time": "15:44:20", "remaining_time": "11:45:40", "throughput": 7749.55, "total_tokens": 439091200} {"current_steps": 53700, "total_steps": 93654, "loss": 0.9118, "learning_rate": 1.9639756233721433e-05, "epoch": 1.7201614453200076, "percentage": 57.34, "elapsed_time": "15:52:00", "remaining_time": "11:48:19", "throughput": 7701.38, "total_tokens": 439910400} {"current_steps": 53800, "total_steps": 93654, "loss": 0.8578, "learning_rate": 1.9556991773393686e-05, "epoch": 1.7233647254788904, "percentage": 57.45, "elapsed_time": "15:59:55", "remaining_time": "11:51:05", "throughput": 7652.12, "total_tokens": 440729600} {"current_steps": 53900, "total_steps": 93654, "loss": 0.8907, "learning_rate": 1.9474289889379334e-05, "epoch": 1.7265680056377732, "percentage": 57.55, "elapsed_time": "16:07:46", "remaining_time": "11:53:46", "throughput": 7604.26, "total_tokens": 441548800} {"current_steps": 54000, "total_steps": 93654, "loss": 0.8853, "learning_rate": 1.9391651532472296e-05, "epoch": 1.7297712857966556, "percentage": 57.66, "elapsed_time": "16:15:34", "remaining_time": "11:56:24", "throughput": 7557.33, "total_tokens": 442368000} {"current_steps": 54100, "total_steps": 93654, "loss": 0.8942, "learning_rate": 1.930907765273611e-05, "epoch": 1.7329745659555384, "percentage": 57.77, "elapsed_time": "16:23:40", "remaining_time": "11:59:11", "throughput": 7508.98, "total_tokens": 443187200} {"current_steps": 54200, "total_steps": 93654, "loss": 0.861, "learning_rate": 1.922656919949306e-05, "epoch": 1.7361778461144213, "percentage": 57.87, "elapsed_time": "16:31:35", "remaining_time": "12:01:49", "throughput": 7462.79, "total_tokens": 444006400} {"current_steps": 54300, "total_steps": 93654, "loss": 0.8764, "learning_rate": 1.914412712131325e-05, "epoch": 1.7393811262733039, "percentage": 57.98, "elapsed_time": "16:39:32", "remaining_time": "12:04:25", "throughput": 7417.18, "total_tokens": 444825600} {"current_steps": 54400, "total_steps": 93654, "loss": 0.9054, "learning_rate": 1.906175236600366e-05, "epoch": 1.7425844064321865, "percentage": 58.09, "elapsed_time": "16:47:42", "remaining_time": "12:07:08", "throughput": 7370.62, "total_tokens": 445644800} {"current_steps": 54500, "total_steps": 93654, "loss": 0.9166, "learning_rate": 1.8979445880597332e-05, "epoch": 1.7457876865910693, "percentage": 58.19, "elapsed_time": "16:55:44", "remaining_time": "12:09:44", "throughput": 7325.72, "total_tokens": 446464000} {"current_steps": 54600, "total_steps": 93654, "loss": 0.893, "learning_rate": 1.8897208611342392e-05, "epoch": 1.748990966749952, "percentage": 58.3, "elapsed_time": "17:03:41", "remaining_time": "12:12:12", "throughput": 7282.24, "total_tokens": 447283200} {"current_steps": 54700, "total_steps": 93654, "loss": 0.8883, "learning_rate": 1.881504150369125e-05, "epoch": 1.7521942469088345, "percentage": 58.41, "elapsed_time": "17:11:24", "remaining_time": "12:14:30", "throughput": 7241.0, "total_tokens": 448102400} {"current_steps": 54800, "total_steps": 93654, "loss": 0.9114, "learning_rate": 1.873294550228965e-05, "epoch": 1.7553975270677173, "percentage": 58.51, "elapsed_time": "17:19:12", "remaining_time": "12:16:48", "throughput": 7199.71, "total_tokens": 448921600} {"current_steps": 54900, "total_steps": 93654, "loss": 0.9675, "learning_rate": 1.8650921550965884e-05, "epoch": 1.7586008072266002, "percentage": 58.62, "elapsed_time": "17:26:49", "remaining_time": "12:18:57", "throughput": 7160.35, "total_tokens": 449740800} {"current_steps": 55000, "total_steps": 93654, "loss": 0.9055, "learning_rate": 1.8568970592719903e-05, "epoch": 1.7618040873854828, "percentage": 58.73, "elapsed_time": "17:34:26", "remaining_time": "12:21:04", "throughput": 7121.57, "total_tokens": 450560000} {"current_steps": 55100, "total_steps": 93654, "loss": 0.8753, "learning_rate": 1.8487093569712482e-05, "epoch": 1.7650073675443654, "percentage": 58.83, "elapsed_time": "17:42:11", "remaining_time": "12:23:13", "throughput": 7082.46, "total_tokens": 451379200} {"current_steps": 55100, "total_steps": 93654, "loss": 0.8754, "learning_rate": 1.8487093569712482e-05, "epoch": 1.7650073675443654, "percentage": 58.83, "elapsed_time": "0:08:21", "remaining_time": "0:05:50", "throughput": 900347.45, "total_tokens": 451379200} {"current_steps": 55200, "total_steps": 93654, "loss": 0.9695, "learning_rate": 1.84052914232544e-05, "epoch": 1.7682106477032482, "percentage": 58.94, "elapsed_time": "0:16:58", "remaining_time": "0:11:49", "throughput": 444202.22, "total_tokens": 452198400} {"current_steps": 55300, "total_steps": 93654, "loss": 0.8756, "learning_rate": 1.8323565093795576e-05, "epoch": 1.7714139278621308, "percentage": 59.05, "elapsed_time": "0:26:21", "remaining_time": "0:18:16", "throughput": 286519.41, "total_tokens": 453017600} {"current_steps": 55400, "total_steps": 93654, "loss": 0.8884, "learning_rate": 1.824191552091431e-05, "epoch": 1.7746172080210134, "percentage": 59.15, "elapsed_time": "0:35:33", "remaining_time": "0:24:32", "throughput": 212750.8, "total_tokens": 453836800} {"current_steps": 55500, "total_steps": 93654, "loss": 0.901, "learning_rate": 1.8160343643306467e-05, "epoch": 1.7778204881798962, "percentage": 59.26, "elapsed_time": "0:49:09", "remaining_time": "0:33:47", "throughput": 154169.03, "total_tokens": 454656000} {"current_steps": 55600, "total_steps": 93654, "loss": 0.8653, "learning_rate": 1.8078850398774666e-05, "epoch": 1.781023768338779, "percentage": 59.37, "elapsed_time": "1:00:42", "remaining_time": "0:41:33", "throughput": 125033.23, "total_tokens": 455475200} {"current_steps": 55700, "total_steps": 93654, "loss": 0.9307, "learning_rate": 1.7997436724217517e-05, "epoch": 1.7842270484976614, "percentage": 59.47, "elapsed_time": "1:13:56", "remaining_time": "0:50:22", "throughput": 102858.34, "total_tokens": 456294400} {"current_steps": 55800, "total_steps": 93654, "loss": 0.8938, "learning_rate": 1.7916103555618818e-05, "epoch": 1.7874303286565443, "percentage": 59.58, "elapsed_time": "1:21:38", "remaining_time": "0:55:23", "throughput": 93315.73, "total_tokens": 457113600} {"current_steps": 55900, "total_steps": 93654, "loss": 0.8622, "learning_rate": 1.7834851828036855e-05, "epoch": 1.790633608815427, "percentage": 59.69, "elapsed_time": "1:29:14", "remaining_time": "1:00:16", "throughput": 85521.53, "total_tokens": 457932800} {"current_steps": 56000, "total_steps": 93654, "loss": 0.9165, "learning_rate": 1.7753682475593587e-05, "epoch": 1.7938368889743097, "percentage": 59.79, "elapsed_time": "1:36:53", "remaining_time": "1:05:09", "throughput": 78907.05, "total_tokens": 458752000} {"current_steps": 56100, "total_steps": 93654, "loss": 0.9159, "learning_rate": 1.7672596431463963e-05, "epoch": 1.7970401691331923, "percentage": 59.9, "elapsed_time": "1:44:46", "remaining_time": "1:10:08", "throughput": 73103.73, "total_tokens": 459571200} {"current_steps": 56200, "total_steps": 93654, "loss": 0.928, "learning_rate": 1.7591594627865134e-05, "epoch": 1.8002434492920751, "percentage": 60.01, "elapsed_time": "1:52:35", "remaining_time": "1:15:02", "throughput": 68148.07, "total_tokens": 460390400} {"current_steps": 56300, "total_steps": 93654, "loss": 0.8891, "learning_rate": 1.7510677996045787e-05, "epoch": 1.8034467294509577, "percentage": 60.11, "elapsed_time": "2:01:17", "remaining_time": "1:20:28", "throughput": 63375.57, "total_tokens": 461209600} {"current_steps": 56400, "total_steps": 93654, "loss": 0.9163, "learning_rate": 1.7429847466275424e-05, "epoch": 1.8066500096098403, "percentage": 60.22, "elapsed_time": "2:10:15", "remaining_time": "1:26:02", "throughput": 59115.57, "total_tokens": 462028800} {"current_steps": 56500, "total_steps": 93654, "loss": 0.9401, "learning_rate": 1.734910396783364e-05, "epoch": 1.8098532897687232, "percentage": 60.33, "elapsed_time": "2:18:34", "remaining_time": "1:31:07", "throughput": 55665.57, "total_tokens": 462848000} {"current_steps": 56600, "total_steps": 93654, "loss": 0.9391, "learning_rate": 1.7268448428999508e-05, "epoch": 1.813056569927606, "percentage": 60.44, "elapsed_time": "2:26:34", "remaining_time": "1:35:57", "throughput": 52723.73, "total_tokens": 463667200} {"current_steps": 56700, "total_steps": 93654, "loss": 0.8751, "learning_rate": 1.71878817770408e-05, "epoch": 1.8162598500864886, "percentage": 60.54, "elapsed_time": "2:34:26", "remaining_time": "1:40:39", "throughput": 50124.82, "total_tokens": 464486400} {"current_steps": 56800, "total_steps": 93654, "loss": 0.9578, "learning_rate": 1.7107404938203422e-05, "epoch": 1.8194631302453712, "percentage": 60.65, "elapsed_time": "2:42:22", "remaining_time": "1:45:21", "throughput": 47759.48, "total_tokens": 465305600} {"current_steps": 56900, "total_steps": 93654, "loss": 0.9462, "learning_rate": 1.702701883770074e-05, "epoch": 1.822666410404254, "percentage": 60.76, "elapsed_time": "2:50:17", "remaining_time": "1:50:00", "throughput": 45619.24, "total_tokens": 466124800} {"current_steps": 57000, "total_steps": 93654, "loss": 0.8676, "learning_rate": 1.6946724399702905e-05, "epoch": 1.8258696905631366, "percentage": 60.86, "elapsed_time": "2:58:19", "remaining_time": "1:54:40", "throughput": 43641.58, "total_tokens": 466944000} {"current_steps": 57100, "total_steps": 93654, "loss": 0.9282, "learning_rate": 1.6866522547326292e-05, "epoch": 1.8290729707220192, "percentage": 60.97, "elapsed_time": "3:06:12", "remaining_time": "1:59:12", "throughput": 41867.33, "total_tokens": 467763200} {"current_steps": 57200, "total_steps": 93654, "loss": 0.8611, "learning_rate": 1.6786414202622818e-05, "epoch": 1.832276250880902, "percentage": 61.08, "elapsed_time": "3:14:40", "remaining_time": "2:04:04", "throughput": 40115.19, "total_tokens": 468582400} {"current_steps": 57300, "total_steps": 93654, "loss": 0.8977, "learning_rate": 1.670640028656939e-05, "epoch": 1.835479531039785, "percentage": 61.18, "elapsed_time": "3:24:06", "remaining_time": "2:09:29", "throughput": 38329.57, "total_tokens": 469401600} {"current_steps": 57400, "total_steps": 93654, "loss": 0.9157, "learning_rate": 1.662648171905731e-05, "epoch": 1.8386828111986673, "percentage": 61.29, "elapsed_time": "3:33:30", "remaining_time": "2:14:51", "throughput": 36705.7, "total_tokens": 470220800} {"current_steps": 57500, "total_steps": 93654, "loss": 0.8808, "learning_rate": 1.654665941888169e-05, "epoch": 1.84188609135755, "percentage": 61.4, "elapsed_time": "3:42:58", "remaining_time": "2:20:11", "throughput": 35209.65, "total_tokens": 471040000} {"current_steps": 57600, "total_steps": 93654, "loss": 0.9322, "learning_rate": 1.6466934303730866e-05, "epoch": 1.845089371516433, "percentage": 61.5, "elapsed_time": "3:51:23", "remaining_time": "2:24:50", "throughput": 33986.7, "total_tokens": 471859200} {"current_steps": 57700, "total_steps": 93654, "loss": 0.9141, "learning_rate": 1.6387307290175914e-05, "epoch": 1.8482926516753155, "percentage": 61.61, "elapsed_time": "3:59:19", "remaining_time": "2:29:07", "throughput": 32917.34, "total_tokens": 472678400} {"current_steps": 57800, "total_steps": 93654, "loss": 0.8777, "learning_rate": 1.6307779293660034e-05, "epoch": 1.8514959318341981, "percentage": 61.72, "elapsed_time": "4:07:20", "remaining_time": "2:33:25", "throughput": 31905.58, "total_tokens": 473497600} {"current_steps": 57900, "total_steps": 93654, "loss": 0.8596, "learning_rate": 1.622835122848809e-05, "epoch": 1.854699211993081, "percentage": 61.82, "elapsed_time": "4:15:22", "remaining_time": "2:37:41", "throughput": 30956.4, "total_tokens": 474316800} {"current_steps": 58000, "total_steps": 93654, "loss": 0.9112, "learning_rate": 1.6149024007816067e-05, "epoch": 1.8579024921519636, "percentage": 61.93, "elapsed_time": "4:23:30", "remaining_time": "2:41:59", "throughput": 30051.16, "total_tokens": 475136000} {"current_steps": 58100, "total_steps": 93654, "loss": 0.9514, "learning_rate": 1.6069798543640543e-05, "epoch": 1.8611057723108462, "percentage": 62.04, "elapsed_time": "4:31:30", "remaining_time": "2:46:08", "throughput": 29216.88, "total_tokens": 475955200} {"current_steps": 58200, "total_steps": 93654, "loss": 0.8633, "learning_rate": 1.599067574678829e-05, "epoch": 1.864309052469729, "percentage": 62.14, "elapsed_time": "4:39:24", "remaining_time": "2:50:12", "throughput": 28440.19, "total_tokens": 476774400} {"current_steps": 58300, "total_steps": 93654, "loss": 0.8828, "learning_rate": 1.591165652690571e-05, "epoch": 1.8675123326286118, "percentage": 62.25, "elapsed_time": "4:47:35", "remaining_time": "2:54:23", "throughput": 27677.9, "total_tokens": 477593600} {"current_steps": 58400, "total_steps": 93654, "loss": 0.8529, "learning_rate": 1.5832741792448447e-05, "epoch": 1.8707156127874944, "percentage": 62.36, "elapsed_time": "4:55:22", "remaining_time": "2:58:18", "throughput": 26995.25, "total_tokens": 478412800} {"current_steps": 58500, "total_steps": 93654, "loss": 0.8634, "learning_rate": 1.5753932450670892e-05, "epoch": 1.873918892946377, "percentage": 62.46, "elapsed_time": "5:03:00", "remaining_time": "3:02:04", "throughput": 26360.12, "total_tokens": 479232000} {"current_steps": 58600, "total_steps": 93654, "loss": 0.8692, "learning_rate": 1.5675229407615773e-05, "epoch": 1.8771221731052599, "percentage": 62.57, "elapsed_time": "5:10:37", "remaining_time": "3:05:48", "throughput": 25757.12, "total_tokens": 480051200} {"current_steps": 58700, "total_steps": 93654, "loss": 0.8899, "learning_rate": 1.5596633568103764e-05, "epoch": 1.8803254532641425, "percentage": 62.68, "elapsed_time": "5:18:14", "remaining_time": "3:09:29", "throughput": 25184.28, "total_tokens": 480870400} {"current_steps": 58800, "total_steps": 93654, "loss": 0.9001, "learning_rate": 1.5518145835723034e-05, "epoch": 1.883528733423025, "percentage": 62.78, "elapsed_time": "5:25:51", "remaining_time": "3:13:09", "throughput": 24636.73, "total_tokens": 481689600} {"current_steps": 58100, "total_steps": 93654, "loss": 0.9513, "learning_rate": 1.6069798543640543e-05, "epoch": 1.8611057723108462, "percentage": 62.04, "elapsed_time": "0:08:04", "remaining_time": "0:04:56", "throughput": 981633.3, "total_tokens": 475955200} {"current_steps": 58200, "total_steps": 93654, "loss": 0.8633, "learning_rate": 1.599067574678829e-05, "epoch": 1.864309052469729, "percentage": 62.14, "elapsed_time": "0:23:51", "remaining_time": "0:14:32", "throughput": 332980.23, "total_tokens": 476774400} {"current_steps": 58300, "total_steps": 93654, "loss": 0.8829, "learning_rate": 1.591165652690571e-05, "epoch": 1.8675123326286118, "percentage": 62.25, "elapsed_time": "0:36:23", "remaining_time": "0:22:04", "throughput": 218745.11, "total_tokens": 477593600} {"current_steps": 58400, "total_steps": 93654, "loss": 0.853, "learning_rate": 1.5832741792448447e-05, "epoch": 1.8707156127874944, "percentage": 62.36, "elapsed_time": "0:45:44", "remaining_time": "0:27:36", "throughput": 174310.56, "total_tokens": 478412800} {"current_steps": 58500, "total_steps": 93654, "loss": 0.8632, "learning_rate": 1.5753932450670892e-05, "epoch": 1.873918892946377, "percentage": 62.46, "elapsed_time": "0:55:29", "remaining_time": "0:33:20", "throughput": 143937.79, "total_tokens": 479232000} {"current_steps": 58600, "total_steps": 93654, "loss": 0.8691, "learning_rate": 1.5675229407615773e-05, "epoch": 1.8771221731052599, "percentage": 62.57, "elapsed_time": "1:03:58", "remaining_time": "0:38:15", "throughput": 125072.06, "total_tokens": 480051200} {"current_steps": 58700, "total_steps": 93654, "loss": 0.8898, "learning_rate": 1.5596633568103764e-05, "epoch": 1.8803254532641425, "percentage": 62.68, "elapsed_time": "1:12:40", "remaining_time": "0:43:16", "throughput": 110271.99, "total_tokens": 480870400} {"current_steps": 58800, "total_steps": 93654, "loss": 0.9001, "learning_rate": 1.5518145835723034e-05, "epoch": 1.883528733423025, "percentage": 62.78, "elapsed_time": "1:21:31", "remaining_time": "0:48:19", "throughput": 98484.26, "total_tokens": 481689600} {"current_steps": 58900, "total_steps": 93654, "loss": 0.8988, "learning_rate": 1.54397671128189e-05, "epoch": 1.886732013581908, "percentage": 62.89, "elapsed_time": "1:30:09", "remaining_time": "0:53:11", "throughput": 89196.8, "total_tokens": 482508800} {"current_steps": 59000, "total_steps": 93654, "loss": 0.8744, "learning_rate": 1.5361498300483423e-05, "epoch": 1.8899352937407907, "percentage": 63.0, "elapsed_time": "1:37:47", "remaining_time": "0:57:26", "throughput": 82375.11, "total_tokens": 483328000} {"current_steps": 59100, "total_steps": 93654, "loss": 0.919, "learning_rate": 1.5283340298545056e-05, "epoch": 1.893138573899673, "percentage": 63.1, "elapsed_time": "1:45:41", "remaining_time": "1:01:47", "throughput": 76344.1, "total_tokens": 484147200} {"current_steps": 59200, "total_steps": 93654, "loss": 0.9134, "learning_rate": 1.5205294005558335e-05, "epoch": 1.896341854058556, "percentage": 63.21, "elapsed_time": "1:54:06", "remaining_time": "1:06:24", "throughput": 70837.49, "total_tokens": 484966400} {"current_steps": 59300, "total_steps": 93654, "loss": 0.8912, "learning_rate": 1.5127360318793481e-05, "epoch": 1.8995451342174388, "percentage": 63.32, "elapsed_time": "2:02:04", "remaining_time": "1:10:43", "throughput": 66319.53, "total_tokens": 485785600} {"current_steps": 59400, "total_steps": 93654, "loss": 0.8857, "learning_rate": 1.5049540134226158e-05, "epoch": 1.9027484143763214, "percentage": 63.42, "elapsed_time": "2:10:11", "remaining_time": "1:15:04", "throughput": 62290.06, "total_tokens": 486604800} {"current_steps": 59500, "total_steps": 93654, "loss": 0.9104, "learning_rate": 1.4971834346527102e-05, "epoch": 1.905951694535204, "percentage": 63.53, "elapsed_time": "2:17:57", "remaining_time": "1:19:11", "throughput": 58883.42, "total_tokens": 487424000} {"current_steps": 59600, "total_steps": 93654, "loss": 0.8938, "learning_rate": 1.4894243849051889e-05, "epoch": 1.9091549746940868, "percentage": 63.64, "elapsed_time": "2:25:33", "remaining_time": "1:23:10", "throughput": 55902.86, "total_tokens": 488243200} {"current_steps": 59700, "total_steps": 93654, "loss": 0.9233, "learning_rate": 1.4816769533830638e-05, "epoch": 1.9123582548529694, "percentage": 63.75, "elapsed_time": "2:33:10", "remaining_time": "1:27:07", "throughput": 53211.75, "total_tokens": 489062400} {"current_steps": 59100, "total_steps": 93654, "loss": 0.9189, "learning_rate": 1.5283340298545056e-05, "epoch": 1.893138573899673, "percentage": 63.1, "elapsed_time": "0:07:47", "remaining_time": "0:04:33", "throughput": 1034790.88, "total_tokens": 484147200} {"current_steps": 59200, "total_steps": 93654, "loss": 0.9133, "learning_rate": 1.5205294005558335e-05, "epoch": 1.896341854058556, "percentage": 63.21, "elapsed_time": "0:15:28", "remaining_time": "0:09:00", "throughput": 522513.74, "total_tokens": 484966400} {"current_steps": 59300, "total_steps": 93654, "loss": 0.8913, "learning_rate": 1.5127360318793481e-05, "epoch": 1.8995451342174388, "percentage": 63.32, "elapsed_time": "0:23:06", "remaining_time": "0:13:23", "throughput": 350402.9, "total_tokens": 485785600} {"current_steps": 59400, "total_steps": 93654, "loss": 0.8857, "learning_rate": 1.5049540134226158e-05, "epoch": 1.9027484143763214, "percentage": 63.42, "elapsed_time": "0:30:45", "remaining_time": "0:17:44", "throughput": 263658.71, "total_tokens": 486604800} {"current_steps": 59500, "total_steps": 93654, "loss": 0.9104, "learning_rate": 1.4971834346527102e-05, "epoch": 1.905951694535204, "percentage": 63.53, "elapsed_time": "0:38:24", "remaining_time": "0:22:02", "throughput": 211510.95, "total_tokens": 487424000} {"current_steps": 59600, "total_steps": 93654, "loss": 0.8936, "learning_rate": 1.4894243849051889e-05, "epoch": 1.9091549746940868, "percentage": 63.64, "elapsed_time": "0:46:01", "remaining_time": "0:26:17", "throughput": 176815.49, "total_tokens": 488243200} {"current_steps": 59700, "total_steps": 93654, "loss": 0.9233, "learning_rate": 1.4816769533830638e-05, "epoch": 1.9123582548529694, "percentage": 63.75, "elapsed_time": "0:53:39", "remaining_time": "0:30:30", "throughput": 151914.04, "total_tokens": 489062400} {"current_steps": 59800, "total_steps": 93654, "loss": 0.893, "learning_rate": 1.4739412291557774e-05, "epoch": 1.915561535011852, "percentage": 63.85, "elapsed_time": "1:01:15", "remaining_time": "0:34:40", "throughput": 133296.65, "total_tokens": 489881600} {"current_steps": 59900, "total_steps": 93654, "loss": 0.8643, "learning_rate": 1.4662173011581757e-05, "epoch": 1.9187648151707348, "percentage": 63.96, "elapsed_time": "1:08:51", "remaining_time": "0:38:48", "throughput": 118763.91, "total_tokens": 490700800} {"current_steps": 60000, "total_steps": 93654, "loss": 0.9376, "learning_rate": 1.4585052581894881e-05, "epoch": 1.9219680953296177, "percentage": 64.07, "elapsed_time": "1:16:30", "remaining_time": "0:42:54", "throughput": 107077.4, "total_tokens": 491520000} {"current_steps": 60100, "total_steps": 93654, "loss": 0.9354, "learning_rate": 1.4508051889123075e-05, "epoch": 1.9251713754885003, "percentage": 64.17, "elapsed_time": "1:24:13", "remaining_time": "0:47:01", "throughput": 97430.33, "total_tokens": 492339200} {"current_steps": 60200, "total_steps": 93654, "loss": 0.8201, "learning_rate": 1.4431171818515698e-05, "epoch": 1.9283746556473829, "percentage": 64.28, "elapsed_time": "1:31:50", "remaining_time": "0:51:02", "throughput": 89495.83, "total_tokens": 493158400} {"current_steps": 60300, "total_steps": 93654, "loss": 0.8322, "learning_rate": 1.4354413253935336e-05, "epoch": 1.9315779358062657, "percentage": 64.39, "elapsed_time": "1:39:27", "remaining_time": "0:55:00", "throughput": 82778.16, "total_tokens": 493977600} {"current_steps": 60400, "total_steps": 93654, "loss": 0.9181, "learning_rate": 1.4277777077847665e-05, "epoch": 1.9347812159651483, "percentage": 64.49, "elapsed_time": "1:47:03", "remaining_time": "0:58:56", "throughput": 77032.88, "total_tokens": 494796800} {"current_steps": 60500, "total_steps": 93654, "loss": 0.8783, "learning_rate": 1.420126417131133e-05, "epoch": 1.937984496124031, "percentage": 64.6, "elapsed_time": "1:54:39", "remaining_time": "1:02:49", "throughput": 72046.22, "total_tokens": 495616000} {"current_steps": 60600, "total_steps": 93654, "loss": 0.9239, "learning_rate": 1.4124875413967767e-05, "epoch": 1.9411877762829137, "percentage": 64.71, "elapsed_time": "2:02:17", "remaining_time": "1:06:42", "throughput": 67657.59, "total_tokens": 496435200} {"current_steps": 60700, "total_steps": 93654, "loss": 0.8908, "learning_rate": 1.4048611684031138e-05, "epoch": 1.9443910564417966, "percentage": 64.81, "elapsed_time": "2:09:54", "remaining_time": "1:10:31", "throughput": 63793.65, "total_tokens": 497254400} {"current_steps": 60800, "total_steps": 93654, "loss": 0.8845, "learning_rate": 1.3972473858278184e-05, "epoch": 1.947594336600679, "percentage": 64.92, "elapsed_time": "2:17:33", "remaining_time": "1:14:19", "throughput": 60349.75, "total_tokens": 498073600} {"current_steps": 60900, "total_steps": 93654, "loss": 0.8902, "learning_rate": 1.3896462812038168e-05, "epoch": 1.9507976167595618, "percentage": 65.03, "elapsed_time": "2:25:11", "remaining_time": "1:18:05", "throughput": 57270.54, "total_tokens": 498892800} {"current_steps": 61000, "total_steps": 93654, "loss": 0.9283, "learning_rate": 1.3820579419182838e-05, "epoch": 1.9540008969184446, "percentage": 65.13, "elapsed_time": "2:32:50", "remaining_time": "1:21:49", "throughput": 54490.93, "total_tokens": 499712000} {"current_steps": 61100, "total_steps": 93654, "loss": 0.9166, "learning_rate": 1.3744824552116343e-05, "epoch": 1.9572041770773272, "percentage": 65.24, "elapsed_time": "2:40:37", "remaining_time": "1:25:34", "throughput": 51936.63, "total_tokens": 500531200} {"current_steps": 61200, "total_steps": 93654, "loss": 0.9069, "learning_rate": 1.3669199081765232e-05, "epoch": 1.9604074572362098, "percentage": 65.35, "elapsed_time": "2:48:14", "remaining_time": "1:29:12", "throughput": 49667.07, "total_tokens": 501350400} {"current_steps": 61300, "total_steps": 93654, "loss": 0.9138, "learning_rate": 1.3593703877568407e-05, "epoch": 1.9636107373950926, "percentage": 65.45, "elapsed_time": "2:55:54", "remaining_time": "1:32:50", "throughput": 47580.86, "total_tokens": 502169600} {"current_steps": 61400, "total_steps": 93654, "loss": 0.8311, "learning_rate": 1.3518339807467138e-05, "epoch": 1.9668140175539752, "percentage": 65.56, "elapsed_time": "3:03:30", "remaining_time": "1:36:24", "throughput": 45681.77, "total_tokens": 502988800} {"current_steps": 61500, "total_steps": 93654, "loss": 0.9508, "learning_rate": 1.3443107737895121e-05, "epoch": 1.9700172977128578, "percentage": 65.67, "elapsed_time": "3:11:10", "remaining_time": "1:39:57", "throughput": 43921.34, "total_tokens": 503808000} {"current_steps": 61600, "total_steps": 93654, "loss": 0.8986, "learning_rate": 1.3368008533768478e-05, "epoch": 1.9732205778717407, "percentage": 65.77, "elapsed_time": "3:18:48", "remaining_time": "1:43:26", "throughput": 42305.94, "total_tokens": 504627200} {"current_steps": 61700, "total_steps": 93654, "loss": 0.8775, "learning_rate": 1.3293043058475835e-05, "epoch": 1.9764238580306235, "percentage": 65.88, "elapsed_time": "3:26:25", "remaining_time": "1:46:54", "throughput": 40807.93, "total_tokens": 505446400} {"current_steps": 61800, "total_steps": 93654, "loss": 0.8588, "learning_rate": 1.321821217386836e-05, "epoch": 1.979627138189506, "percentage": 65.99, "elapsed_time": "3:34:05", "remaining_time": "1:50:20", "throughput": 39412.95, "total_tokens": 506265600} {"current_steps": 61900, "total_steps": 93654, "loss": 0.9, "learning_rate": 1.314351674024989e-05, "epoch": 1.9828304183483887, "percentage": 66.09, "elapsed_time": "3:41:45", "remaining_time": "1:53:45", "throughput": 38111.94, "total_tokens": 507084800} {"current_steps": 62000, "total_steps": 93654, "loss": 0.8931, "learning_rate": 1.3068957616367045e-05, "epoch": 1.9860336985072715, "percentage": 66.2, "elapsed_time": "3:49:22", "remaining_time": "1:57:06", "throughput": 36904.59, "total_tokens": 507904000} {"current_steps": 62100, "total_steps": 93654, "loss": 0.9254, "learning_rate": 1.2994535659399327e-05, "epoch": 1.9892369786661541, "percentage": 66.31, "elapsed_time": "3:57:03", "remaining_time": "2:00:27", "throughput": 35766.81, "total_tokens": 508723200} {"current_steps": 62200, "total_steps": 93654, "loss": 0.8628, "learning_rate": 1.2920251724949296e-05, "epoch": 1.9924402588250367, "percentage": 66.41, "elapsed_time": "4:04:43", "remaining_time": "2:03:45", "throughput": 34702.34, "total_tokens": 509542400} {"current_steps": 62300, "total_steps": 93654, "loss": 0.8509, "learning_rate": 1.2846106667032693e-05, "epoch": 1.9956435389839196, "percentage": 66.52, "elapsed_time": "4:12:21", "remaining_time": "2:07:00", "throughput": 33706.57, "total_tokens": 510361600} {"current_steps": 62400, "total_steps": 93654, "loss": 0.8547, "learning_rate": 1.2772101338068649e-05, "epoch": 1.9988468191428024, "percentage": 66.63, "elapsed_time": "4:19:59", "remaining_time": "2:10:13", "throughput": 32769.73, "total_tokens": 511180800} {"current_steps": 62500, "total_steps": 93654, "loss": 0.8274, "learning_rate": 1.2698236588869894e-05, "epoch": 2.0020500993016848, "percentage": 66.74, "elapsed_time": "4:27:37", "remaining_time": "2:13:23", "throughput": 31886.07, "total_tokens": 512000000} {"current_steps": 62600, "total_steps": 93654, "loss": 0.8213, "learning_rate": 1.2624513268632967e-05, "epoch": 2.0052533794605676, "percentage": 66.84, "elapsed_time": "4:35:13", "remaining_time": "2:16:32", "throughput": 31053.74, "total_tokens": 512819200} {"current_steps": 62700, "total_steps": 93654, "loss": 0.8608, "learning_rate": 1.2550932224928425e-05, "epoch": 2.0084566596194504, "percentage": 66.95, "elapsed_time": "4:42:52", "remaining_time": "2:19:39", "throughput": 30262.44, "total_tokens": 513638400} {"current_steps": 62800, "total_steps": 93654, "loss": 0.836, "learning_rate": 1.2477494303691157e-05, "epoch": 2.011659939778333, "percentage": 67.06, "elapsed_time": "4:50:32", "remaining_time": "2:22:44", "throughput": 29510.86, "total_tokens": 514457600} {"current_steps": 62900, "total_steps": 93654, "loss": 0.8208, "learning_rate": 1.2404200349210577e-05, "epoch": 2.0148632199372156, "percentage": 67.16, "elapsed_time": "4:58:10", "remaining_time": "2:25:47", "throughput": 28801.03, "total_tokens": 515276800} {"current_steps": 63000, "total_steps": 93654, "loss": 0.8293, "learning_rate": 1.2331051204121009e-05, "epoch": 2.0180665000960984, "percentage": 67.27, "elapsed_time": "5:05:48", "remaining_time": "2:28:47", "throughput": 28127.94, "total_tokens": 516096000} {"current_steps": 63100, "total_steps": 93654, "loss": 0.8663, "learning_rate": 1.2258047709391945e-05, "epoch": 2.0212697802549813, "percentage": 67.38, "elapsed_time": "5:13:28", "remaining_time": "2:31:47", "throughput": 27482.46, "total_tokens": 516915200} {"current_steps": 63200, "total_steps": 93654, "loss": 0.8186, "learning_rate": 1.218519070431836e-05, "epoch": 2.0244730604138637, "percentage": 67.48, "elapsed_time": "5:21:07", "remaining_time": "2:34:44", "throughput": 26870.35, "total_tokens": 517734400} {"current_steps": 63300, "total_steps": 93654, "loss": 0.8468, "learning_rate": 1.2112481026511138e-05, "epoch": 2.0276763405727465, "percentage": 67.59, "elapsed_time": "5:28:45", "remaining_time": "2:37:39", "throughput": 26288.13, "total_tokens": 518553600} {"current_steps": 63400, "total_steps": 93654, "loss": 0.7955, "learning_rate": 1.2039919511887338e-05, "epoch": 2.0308796207316293, "percentage": 67.7, "elapsed_time": "5:36:24", "remaining_time": "2:40:32", "throughput": 25730.89, "total_tokens": 519372800} {"current_steps": 63500, "total_steps": 93654, "loss": 0.8313, "learning_rate": 1.1967506994660685e-05, "epoch": 2.0340829008905117, "percentage": 67.8, "elapsed_time": "5:44:02", "remaining_time": "2:43:22", "throughput": 25200.54, "total_tokens": 520192000} {"current_steps": 63600, "total_steps": 93654, "loss": 0.8387, "learning_rate": 1.1895244307331923e-05, "epoch": 2.0372861810493945, "percentage": 67.91, "elapsed_time": "5:51:41", "remaining_time": "2:46:11", "throughput": 24691.25, "total_tokens": 521011200} {"current_steps": 63700, "total_steps": 93654, "loss": 0.8087, "learning_rate": 1.1823132280679235e-05, "epoch": 2.0404894612082773, "percentage": 68.02, "elapsed_time": "5:59:20", "remaining_time": "2:48:58", "throughput": 24202.97, "total_tokens": 521830400} {"current_steps": 63800, "total_steps": 93654, "loss": 0.8357, "learning_rate": 1.1751171743748737e-05, "epoch": 2.04369274136716, "percentage": 68.12, "elapsed_time": "6:06:57", "remaining_time": "2:51:42", "throughput": 23737.76, "total_tokens": 522649600} {"current_steps": 63900, "total_steps": 93654, "loss": 0.8435, "learning_rate": 1.1679363523844918e-05, "epoch": 2.0468960215260426, "percentage": 68.23, "elapsed_time": "6:14:36", "remaining_time": "2:54:25", "throughput": 23289.21, "total_tokens": 523468800} {"current_steps": 64000, "total_steps": 93654, "loss": 0.8702, "learning_rate": 1.1607708446521125e-05, "epoch": 2.0500993016849254, "percentage": 68.34, "elapsed_time": "6:22:14", "remaining_time": "2:57:06", "throughput": 22860.53, "total_tokens": 524288000} {"current_steps": 64100, "total_steps": 93654, "loss": 0.8436, "learning_rate": 1.153620733557007e-05, "epoch": 2.053302581843808, "percentage": 68.44, "elapsed_time": "6:29:53", "remaining_time": "2:59:45", "throughput": 22446.97, "total_tokens": 525107200} {"current_steps": 64200, "total_steps": 93654, "loss": 0.8249, "learning_rate": 1.1464861013014391e-05, "epoch": 2.0565058620026906, "percentage": 68.55, "elapsed_time": "6:37:31", "remaining_time": "3:02:22", "throughput": 22049.67, "total_tokens": 525926400} {"current_steps": 64300, "total_steps": 93654, "loss": 0.8469, "learning_rate": 1.139367029909717e-05, "epoch": 2.0597091421615734, "percentage": 68.66, "elapsed_time": "6:45:11", "remaining_time": "3:04:58", "throughput": 21666.43, "total_tokens": 526745600} {"current_steps": 64400, "total_steps": 93654, "loss": 0.8396, "learning_rate": 1.1322636012272517e-05, "epoch": 2.0629124223204562, "percentage": 68.76, "elapsed_time": "6:52:50", "remaining_time": "3:07:32", "throughput": 21298.29, "total_tokens": 527564800} {"current_steps": 64500, "total_steps": 93654, "loss": 0.7899, "learning_rate": 1.1251758969196147e-05, "epoch": 2.0661157024793386, "percentage": 68.87, "elapsed_time": "7:00:27", "remaining_time": "3:10:02", "throughput": 20944.69, "total_tokens": 528384000} {"current_steps": 64600, "total_steps": 93654, "loss": 0.8451, "learning_rate": 1.1181039984715991e-05, "epoch": 2.0693189826382214, "percentage": 68.98, "elapsed_time": "7:08:05", "remaining_time": "3:12:31", "throughput": 20603.52, "total_tokens": 529203200} {"current_steps": 64700, "total_steps": 93654, "loss": 0.7879, "learning_rate": 1.1110479871862862e-05, "epoch": 2.0725222627971043, "percentage": 69.08, "elapsed_time": "7:15:42", "remaining_time": "3:14:59", "throughput": 20273.99, "total_tokens": 530022400} {"current_steps": 64800, "total_steps": 93654, "loss": 0.866, "learning_rate": 1.1040079441841065e-05, "epoch": 2.075725542955987, "percentage": 69.19, "elapsed_time": "7:23:20", "remaining_time": "3:17:24", "throughput": 19956.38, "total_tokens": 530841600} {"current_steps": 64100, "total_steps": 93654, "loss": 0.8436, "learning_rate": 1.153620733557007e-05, "epoch": 2.053302581843808, "percentage": 68.44, "elapsed_time": "0:07:47", "remaining_time": "0:03:35", "throughput": 1123293.64, "total_tokens": 525107200} {"current_steps": 64200, "total_steps": 93654, "loss": 0.825, "learning_rate": 1.1464861013014391e-05, "epoch": 2.0565058620026906, "percentage": 68.55, "elapsed_time": "0:15:26", "remaining_time": "0:07:05", "throughput": 567732.07, "total_tokens": 525926400} {"current_steps": 64300, "total_steps": 93654, "loss": 0.8469, "learning_rate": 1.139367029909717e-05, "epoch": 2.0597091421615734, "percentage": 68.66, "elapsed_time": "0:23:06", "remaining_time": "0:10:32", "throughput": 379976.45, "total_tokens": 526745600} {"current_steps": 64400, "total_steps": 93654, "loss": 0.8397, "learning_rate": 1.1322636012272517e-05, "epoch": 2.0629124223204562, "percentage": 68.76, "elapsed_time": "0:30:44", "remaining_time": "0:13:57", "throughput": 285980.84, "total_tokens": 527564800} {"current_steps": 64500, "total_steps": 93654, "loss": 0.7898, "learning_rate": 1.1251758969196147e-05, "epoch": 2.0661157024793386, "percentage": 68.87, "elapsed_time": "0:38:22", "remaining_time": "0:17:20", "throughput": 229438.9, "total_tokens": 528384000} {"current_steps": 64600, "total_steps": 93654, "loss": 0.8449, "learning_rate": 1.1181039984715991e-05, "epoch": 2.0693189826382214, "percentage": 68.98, "elapsed_time": "0:46:01", "remaining_time": "0:20:42", "throughput": 191627.57, "total_tokens": 529203200} {"current_steps": 64700, "total_steps": 93654, "loss": 0.7879, "learning_rate": 1.1110479871862862e-05, "epoch": 2.0725222627971043, "percentage": 69.08, "elapsed_time": "0:53:40", "remaining_time": "0:24:01", "throughput": 164600.59, "total_tokens": 530022400} {"current_steps": 64800, "total_steps": 93654, "loss": 0.866, "learning_rate": 1.1040079441841065e-05, "epoch": 2.075725542955987, "percentage": 69.19, "elapsed_time": "1:01:18", "remaining_time": "0:27:17", "throughput": 144315.84, "total_tokens": 530841600} {"current_steps": 64900, "total_steps": 93654, "loss": 0.851, "learning_rate": 1.0969839504019108e-05, "epoch": 2.0789288231148695, "percentage": 69.3, "elapsed_time": "1:08:58", "remaining_time": "0:30:33", "throughput": 128452.98, "total_tokens": 531660800} {"current_steps": 65000, "total_steps": 93654, "loss": 0.814, "learning_rate": 1.0899760865920355e-05, "epoch": 2.0821321032737523, "percentage": 69.4, "elapsed_time": "1:17:11", "remaining_time": "0:34:01", "throughput": 114969.83, "total_tokens": 532480000} {"current_steps": 65100, "total_steps": 93654, "loss": 0.8307, "learning_rate": 1.0829844333213766e-05, "epoch": 2.085335383432635, "percentage": 69.51, "elapsed_time": "1:26:35", "remaining_time": "0:37:58", "throughput": 102655.19, "total_tokens": 533299200} {"current_steps": 65200, "total_steps": 93654, "loss": 0.8406, "learning_rate": 1.0760090709704642e-05, "epoch": 2.0885386635915175, "percentage": 69.62, "elapsed_time": "1:46:29", "remaining_time": "0:46:28", "throughput": 83587.19, "total_tokens": 534118400} {"current_steps": 65300, "total_steps": 93654, "loss": 0.8263, "learning_rate": 1.0690500797325387e-05, "epoch": 2.0917419437504003, "percentage": 69.72, "elapsed_time": "2:21:17", "remaining_time": "1:01:20", "throughput": 63101.69, "total_tokens": 534937600} {"current_steps": 65400, "total_steps": 93654, "loss": 0.7959, "learning_rate": 1.0621075396126265e-05, "epoch": 2.094945223909283, "percentage": 69.83, "elapsed_time": "2:53:50", "remaining_time": "1:15:06", "throughput": 51365.3, "total_tokens": 535756800} {"current_steps": 65500, "total_steps": 93654, "loss": 0.8417, "learning_rate": 1.055181530426621e-05, "epoch": 2.098148504068166, "percentage": 69.94, "elapsed_time": "3:27:53", "remaining_time": "1:29:21", "throughput": 43018.58, "total_tokens": 536576000} {"current_steps": 65600, "total_steps": 93654, "loss": 0.8267, "learning_rate": 1.0482721318003644e-05, "epoch": 2.1013517842270484, "percentage": 70.05, "elapsed_time": "3:41:01", "remaining_time": "1:34:31", "throughput": 40523.03, "total_tokens": 537395200} {"current_steps": 65700, "total_steps": 93654, "loss": 0.811, "learning_rate": 1.0413794231687357e-05, "epoch": 2.104555064385931, "percentage": 70.15, "elapsed_time": "3:49:04", "remaining_time": "1:37:28", "throughput": 39157.53, "total_tokens": 538214400} {"current_steps": 65800, "total_steps": 93654, "loss": 0.8376, "learning_rate": 1.0345034837747342e-05, "epoch": 2.107758344544814, "percentage": 70.26, "elapsed_time": "3:57:14", "remaining_time": "1:40:25", "throughput": 37869.05, "total_tokens": 539033600} {"current_steps": 65900, "total_steps": 93654, "loss": 0.8641, "learning_rate": 1.0276443926685694e-05, "epoch": 2.1109616247036964, "percentage": 70.37, "elapsed_time": "4:05:27", "remaining_time": "1:43:22", "throughput": 36655.17, "total_tokens": 539852800} {"current_steps": 66000, "total_steps": 93654, "loss": 0.8445, "learning_rate": 1.0208022287067509e-05, "epoch": 2.1141649048625792, "percentage": 70.47, "elapsed_time": "4:13:36", "remaining_time": "1:46:15", "throughput": 35532.34, "total_tokens": 540672000} {"current_steps": 66100, "total_steps": 93654, "loss": 0.8783, "learning_rate": 1.0139770705511833e-05, "epoch": 2.117368185021462, "percentage": 70.58, "elapsed_time": "4:21:49", "remaining_time": "1:49:08", "throughput": 34468.78, "total_tokens": 541491200} {"current_steps": 66200, "total_steps": 93654, "loss": 0.7836, "learning_rate": 1.0071689966682623e-05, "epoch": 2.120571465180345, "percentage": 70.69, "elapsed_time": "4:30:00", "remaining_time": "1:51:58", "throughput": 33473.92, "total_tokens": 542310400} {"current_steps": 66300, "total_steps": 93654, "loss": 0.8143, "learning_rate": 1.0003780853279732e-05, "epoch": 2.1237747453392273, "percentage": 70.79, "elapsed_time": "4:38:04", "remaining_time": "1:54:43", "throughput": 32552.24, "total_tokens": 543129600} {"current_steps": 66400, "total_steps": 93654, "loss": 0.8582, "learning_rate": 9.936044146029855e-06, "epoch": 2.12697802549811, "percentage": 70.9, "elapsed_time": "4:46:01", "remaining_time": "1:57:23", "throughput": 31696.03, "total_tokens": 543948800} {"current_steps": 66500, "total_steps": 93654, "loss": 0.8295, "learning_rate": 9.868480623677643e-06, "epoch": 2.130181305656993, "percentage": 71.01, "elapsed_time": "4:54:02", "remaining_time": "2:00:04", "throughput": 30878.02, "total_tokens": 544768000} {"current_steps": 66600, "total_steps": 93654, "loss": 0.7856, "learning_rate": 9.801091062976665e-06, "epoch": 2.1333845858158753, "percentage": 71.11, "elapsed_time": "5:02:02", "remaining_time": "2:02:41", "throughput": 30105.26, "total_tokens": 545587200} {"current_steps": 66700, "total_steps": 93654, "loss": 0.8144, "learning_rate": 9.733876238680531e-06, "epoch": 2.136587865974758, "percentage": 71.22, "elapsed_time": "5:10:05", "remaining_time": "2:05:18", "throughput": 29368.54, "total_tokens": 546406400} {"current_steps": 66800, "total_steps": 93654, "loss": 0.7658, "learning_rate": 9.666836923533987e-06, "epoch": 2.139791146133641, "percentage": 71.33, "elapsed_time": "5:18:08", "remaining_time": "2:07:53", "throughput": 28668.17, "total_tokens": 547225600} {"current_steps": 66900, "total_steps": 93654, "loss": 0.7818, "learning_rate": 9.599973888263972e-06, "epoch": 2.1429944262925233, "percentage": 71.43, "elapsed_time": "5:26:11", "remaining_time": "2:10:26", "throughput": 28001.66, "total_tokens": 548044800} {"current_steps": 67000, "total_steps": 93654, "loss": 0.8259, "learning_rate": 9.533287901570843e-06, "epoch": 2.146197706451406, "percentage": 71.54, "elapsed_time": "5:34:18", "remaining_time": "2:12:59", "throughput": 27363.37, "total_tokens": 548864000} {"current_steps": 67100, "total_steps": 93654, "loss": 0.84, "learning_rate": 9.466779730119449e-06, "epoch": 2.149400986610289, "percentage": 71.65, "elapsed_time": "5:42:22", "remaining_time": "2:15:29", "throughput": 26758.01, "total_tokens": 549683200} {"current_steps": 67200, "total_steps": 93654, "loss": 0.8595, "learning_rate": 9.400450138530394e-06, "epoch": 2.152604266769172, "percentage": 71.75, "elapsed_time": "5:50:23", "remaining_time": "2:17:56", "throughput": 26184.75, "total_tokens": 550502400} {"current_steps": 67300, "total_steps": 93654, "loss": 0.8404, "learning_rate": 9.334299889371217e-06, "epoch": 2.155807546928054, "percentage": 71.86, "elapsed_time": "5:58:38", "remaining_time": "2:20:26", "throughput": 25620.31, "total_tokens": 551321600} {"current_steps": 67400, "total_steps": 93654, "loss": 0.7933, "learning_rate": 9.268329743147583e-06, "epoch": 2.159010827086937, "percentage": 71.97, "elapsed_time": "6:06:41", "remaining_time": "2:22:50", "throughput": 25095.92, "total_tokens": 552140800} {"current_steps": 67500, "total_steps": 93654, "loss": 0.8066, "learning_rate": 9.202540458294623e-06, "epoch": 2.16221410724582, "percentage": 72.07, "elapsed_time": "6:14:43", "remaining_time": "2:25:11", "throughput": 24594.39, "total_tokens": 552960000} {"current_steps": 67600, "total_steps": 93654, "loss": 0.8831, "learning_rate": 9.136932791168132e-06, "epoch": 2.1654173874047022, "percentage": 72.18, "elapsed_time": "6:22:56", "remaining_time": "2:27:35", "throughput": 24102.2, "total_tokens": 553779200} {"current_steps": 67700, "total_steps": 93654, "loss": 0.7602, "learning_rate": 9.071507496035943e-06, "epoch": 2.168620667563585, "percentage": 72.29, "elapsed_time": "6:30:58", "remaining_time": "2:29:53", "throughput": 23641.98, "total_tokens": 554598400} {"current_steps": 67800, "total_steps": 93654, "loss": 0.7984, "learning_rate": 9.006265325069197e-06, "epoch": 2.171823947722468, "percentage": 72.39, "elapsed_time": "6:38:40", "remaining_time": "2:32:01", "throughput": 23218.85, "total_tokens": 555417600} {"current_steps": 67900, "total_steps": 93654, "loss": 0.7831, "learning_rate": 8.941207028333737e-06, "epoch": 2.1750272278813503, "percentage": 72.5, "elapsed_time": "6:46:31", "remaining_time": "2:34:11", "throughput": 22804.32, "total_tokens": 556236800} {"current_steps": 68000, "total_steps": 93654, "loss": 0.829, "learning_rate": 8.876333353781468e-06, "epoch": 2.178230508040233, "percentage": 72.61, "elapsed_time": "6:54:19", "remaining_time": "2:36:18", "throughput": 22407.77, "total_tokens": 557056000} {"current_steps": 68100, "total_steps": 93654, "loss": 0.8621, "learning_rate": 8.811645047241767e-06, "epoch": 2.181433788199116, "percentage": 72.71, "elapsed_time": "7:02:07", "remaining_time": "2:38:24", "throughput": 22026.27, "total_tokens": 557875200} {"current_steps": 68200, "total_steps": 93654, "loss": 0.8444, "learning_rate": 8.74714285241289e-06, "epoch": 2.1846370683579988, "percentage": 72.82, "elapsed_time": "7:09:55", "remaining_time": "2:40:27", "throughput": 21658.71, "total_tokens": 558694400} {"current_steps": 68300, "total_steps": 93654, "loss": 0.8286, "learning_rate": 8.682827510853426e-06, "epoch": 2.187840348516881, "percentage": 72.93, "elapsed_time": "7:17:44", "remaining_time": "2:42:29", "throughput": 21302.91, "total_tokens": 559513600} {"current_steps": 68400, "total_steps": 93654, "loss": 0.7787, "learning_rate": 8.618699761973792e-06, "epoch": 2.191043628675764, "percentage": 73.03, "elapsed_time": "7:26:26", "remaining_time": "2:44:49", "throughput": 20918.76, "total_tokens": 560332800} {"current_steps": 68500, "total_steps": 93654, "loss": 0.8595, "learning_rate": 8.554760343027724e-06, "epoch": 2.194246908834647, "percentage": 73.14, "elapsed_time": "7:36:39", "remaining_time": "2:47:41", "throughput": 20480.74, "total_tokens": 561152000} {"current_steps": 68600, "total_steps": 93654, "loss": 0.8538, "learning_rate": 8.491009989103796e-06, "epoch": 2.197450188993529, "percentage": 73.25, "elapsed_time": "7:44:46", "remaining_time": "2:49:44", "throughput": 20152.36, "total_tokens": 561971200} {"current_steps": 68100, "total_steps": 93654, "loss": 0.8623, "learning_rate": 8.811645047241767e-06, "epoch": 2.181433788199116, "percentage": 72.71, "elapsed_time": "0:08:11", "remaining_time": "0:03:04", "throughput": 1136184.88, "total_tokens": 557875200} {"current_steps": 68200, "total_steps": 93654, "loss": 0.8444, "learning_rate": 8.74714285241289e-06, "epoch": 2.1846370683579988, "percentage": 72.82, "elapsed_time": "0:16:12", "remaining_time": "0:06:02", "throughput": 574559.98, "total_tokens": 558694400} {"current_steps": 68300, "total_steps": 93654, "loss": 0.8287, "learning_rate": 8.682827510853426e-06, "epoch": 2.187840348516881, "percentage": 72.93, "elapsed_time": "0:24:10", "remaining_time": "0:08:58", "throughput": 385867.82, "total_tokens": 559513600} {"current_steps": 68400, "total_steps": 93654, "loss": 0.7785, "learning_rate": 8.618699761973792e-06, "epoch": 2.191043628675764, "percentage": 73.03, "elapsed_time": "0:32:06", "remaining_time": "0:11:51", "throughput": 290830.67, "total_tokens": 560332800} {"current_steps": 68500, "total_steps": 93654, "loss": 0.8595, "learning_rate": 8.554760343027724e-06, "epoch": 2.194246908834647, "percentage": 73.14, "elapsed_time": "0:40:01", "remaining_time": "0:14:41", "throughput": 233714.64, "total_tokens": 561152000} {"current_steps": 68600, "total_steps": 93654, "loss": 0.8538, "learning_rate": 8.491009989103796e-06, "epoch": 2.197450188993529, "percentage": 73.25, "elapsed_time": "0:48:01", "remaining_time": "0:17:32", "throughput": 195005.16, "total_tokens": 561971200} {"current_steps": 68700, "total_steps": 93654, "loss": 0.8333, "learning_rate": 8.427449433116952e-06, "epoch": 2.200653469152412, "percentage": 73.36, "elapsed_time": "0:56:06", "remaining_time": "0:20:22", "throughput": 167181.51, "total_tokens": 562790400} {"current_steps": 68800, "total_steps": 93654, "loss": 0.8281, "learning_rate": 8.364079405800105e-06, "epoch": 2.203856749311295, "percentage": 73.46, "elapsed_time": "1:04:11", "remaining_time": "0:23:11", "throughput": 146316.12, "total_tokens": 563609600} {"current_steps": 68900, "total_steps": 93654, "loss": 0.7887, "learning_rate": 8.30090063569573e-06, "epoch": 2.2070600294701777, "percentage": 73.57, "elapsed_time": "1:17:01", "remaining_time": "0:27:40", "throughput": 122124.13, "total_tokens": 564428800} {"current_steps": 69000, "total_steps": 93654, "loss": 0.8451, "learning_rate": 8.237913849147497e-06, "epoch": 2.21026330962906, "percentage": 73.68, "elapsed_time": "1:32:05", "remaining_time": "0:32:54", "throughput": 102290.62, "total_tokens": 565248000} {"current_steps": 69100, "total_steps": 93654, "loss": 0.8596, "learning_rate": 8.1751197702919e-06, "epoch": 2.213466589787943, "percentage": 73.78, "elapsed_time": "1:43:33", "remaining_time": "0:36:48", "throughput": 91096.63, "total_tokens": 566067200} {"current_steps": 69200, "total_steps": 93654, "loss": 0.8584, "learning_rate": 8.112519121049942e-06, "epoch": 2.2166698699468257, "percentage": 73.89, "elapsed_time": "2:03:08", "remaining_time": "0:43:31", "throughput": 76722.65, "total_tokens": 566886400} {"current_steps": 69300, "total_steps": 93654, "loss": 0.8518, "learning_rate": 8.050112621118822e-06, "epoch": 2.219873150105708, "percentage": 74.0, "elapsed_time": "2:12:03", "remaining_time": "0:46:24", "throughput": 71651.04, "total_tokens": 567705600} {"current_steps": 69400, "total_steps": 93654, "loss": 0.8544, "learning_rate": 7.987900987963695e-06, "epoch": 2.223076430264591, "percentage": 74.1, "elapsed_time": "2:20:08", "remaining_time": "0:48:58", "throughput": 67611.29, "total_tokens": 568524800} {"current_steps": 69500, "total_steps": 93654, "loss": 0.8395, "learning_rate": 7.925884936809396e-06, "epoch": 2.2262797104234737, "percentage": 74.21, "elapsed_time": "2:28:11", "remaining_time": "0:51:30", "throughput": 64033.5, "total_tokens": 569344000} {"current_steps": 69600, "total_steps": 93654, "loss": 0.8681, "learning_rate": 7.864065180632233e-06, "epoch": 2.2294829905823565, "percentage": 74.32, "elapsed_time": "2:36:30", "remaining_time": "0:54:05", "throughput": 60714.27, "total_tokens": 570163200} {"current_steps": 69700, "total_steps": 93654, "loss": 0.7735, "learning_rate": 7.802442430151757e-06, "epoch": 2.232686270741239, "percentage": 74.42, "elapsed_time": "2:44:36", "remaining_time": "0:56:34", "throughput": 57814.55, "total_tokens": 570982400} {"current_steps": 69800, "total_steps": 93654, "loss": 0.7853, "learning_rate": 7.741017393822628e-06, "epoch": 2.2358895509001218, "percentage": 74.53, "elapsed_time": "2:52:41", "remaining_time": "0:59:01", "throughput": 55182.81, "total_tokens": 571801600} {"current_steps": 69900, "total_steps": 93654, "loss": 0.8403, "learning_rate": 7.679790777826459e-06, "epoch": 2.2390928310590046, "percentage": 74.64, "elapsed_time": "3:00:48", "remaining_time": "1:01:26", "throughput": 52782.48, "total_tokens": 572620800} {"current_steps": 70000, "total_steps": 93654, "loss": 0.8336, "learning_rate": 7.618763286063698e-06, "epoch": 2.242296111217887, "percentage": 74.74, "elapsed_time": "3:09:46", "remaining_time": "1:04:07", "throughput": 50362.34, "total_tokens": 573440000} {"current_steps": 70100, "total_steps": 93654, "loss": 0.7682, "learning_rate": 7.55793562014554e-06, "epoch": 2.24549939137677, "percentage": 74.85, "elapsed_time": "3:18:12", "remaining_time": "1:06:35", "throughput": 48288.38, "total_tokens": 574259200} {"current_steps": 70200, "total_steps": 93654, "loss": 0.8367, "learning_rate": 7.497308479385831e-06, "epoch": 2.2487026715356526, "percentage": 74.96, "elapsed_time": "3:26:08", "remaining_time": "1:08:52", "throughput": 46495.35, "total_tokens": 575078400} {"current_steps": 70300, "total_steps": 93654, "loss": 0.8119, "learning_rate": 7.43688256079306e-06, "epoch": 2.2519059516945354, "percentage": 75.06, "elapsed_time": "3:34:15", "remaining_time": "1:11:10", "throughput": 44799.41, "total_tokens": 575897600} {"current_steps": 70400, "total_steps": 93654, "loss": 0.8231, "learning_rate": 7.376658559062349e-06, "epoch": 2.255109231853418, "percentage": 75.17, "elapsed_time": "3:42:18", "remaining_time": "1:13:26", "throughput": 43235.65, "total_tokens": 576716800} {"current_steps": 70500, "total_steps": 93654, "loss": 0.852, "learning_rate": 7.31663716656745e-06, "epoch": 2.2583125120123007, "percentage": 75.28, "elapsed_time": "3:50:32", "remaining_time": "1:15:42", "throughput": 41752.22, "total_tokens": 577536000} {"current_steps": 70600, "total_steps": 93654, "loss": 0.82, "learning_rate": 7.256819073352775e-06, "epoch": 2.2615157921711835, "percentage": 75.38, "elapsed_time": "3:58:33", "remaining_time": "1:17:53", "throughput": 40406.95, "total_tokens": 578355200} {"current_steps": 70700, "total_steps": 93654, "loss": 0.8417, "learning_rate": 7.197204967125498e-06, "epoch": 2.264719072330066, "percentage": 75.49, "elapsed_time": "4:06:36", "remaining_time": "1:20:03", "throughput": 39143.17, "total_tokens": 579174400} {"current_steps": 70800, "total_steps": 93654, "loss": 0.8252, "learning_rate": 7.137795533247604e-06, "epoch": 2.2679223524889487, "percentage": 75.6, "elapsed_time": "4:14:25", "remaining_time": "1:22:07", "throughput": 37993.62, "total_tokens": 579993600} {"current_steps": 70900, "total_steps": 93654, "loss": 0.8195, "learning_rate": 7.078591454728056e-06, "epoch": 2.2711256326478315, "percentage": 75.7, "elapsed_time": "4:22:13", "remaining_time": "1:24:09", "throughput": 36915.84, "total_tokens": 580812800} {"current_steps": 71000, "total_steps": 93654, "loss": 0.8012, "learning_rate": 7.019593412214914e-06, "epoch": 2.274328912806714, "percentage": 75.81, "elapsed_time": "4:29:58", "remaining_time": "1:26:08", "throughput": 35906.65, "total_tokens": 581632000} {"current_steps": 71100, "total_steps": 93654, "loss": 0.8097, "learning_rate": 6.960802083987503e-06, "epoch": 2.2775321929655967, "percentage": 75.92, "elapsed_time": "4:38:13", "remaining_time": "1:28:15", "throughput": 34890.14, "total_tokens": 582451200} {"current_steps": 71200, "total_steps": 93654, "loss": 0.8216, "learning_rate": 6.902218145948647e-06, "epoch": 2.2807354731244796, "percentage": 76.02, "elapsed_time": "4:46:00", "remaining_time": "1:30:11", "throughput": 33988.82, "total_tokens": 583270400} {"current_steps": 71300, "total_steps": 93654, "loss": 0.829, "learning_rate": 6.8438422716168595e-06, "epoch": 2.283938753283362, "percentage": 76.13, "elapsed_time": "4:53:48", "remaining_time": "1:32:06", "throughput": 33132.77, "total_tokens": 584089600} {"current_steps": 71400, "total_steps": 93654, "loss": 0.8557, "learning_rate": 6.785675132118638e-06, "epoch": 2.2871420334422448, "percentage": 76.24, "elapsed_time": "5:01:37", "remaining_time": "1:34:00", "throughput": 32319.75, "total_tokens": 584908800} {"current_steps": 71500, "total_steps": 93654, "loss": 0.8199, "learning_rate": 6.72771739618073e-06, "epoch": 2.2903453136011276, "percentage": 76.34, "elapsed_time": "5:09:23", "remaining_time": "1:35:51", "throughput": 31552.6, "total_tokens": 585728000} {"current_steps": 71600, "total_steps": 93654, "loss": 0.876, "learning_rate": 6.6699697301224214e-06, "epoch": 2.2935485937600104, "percentage": 76.45, "elapsed_time": "5:17:11", "remaining_time": "1:37:42", "throughput": 30819.88, "total_tokens": 586547200} {"current_steps": 71700, "total_steps": 93654, "loss": 0.8013, "learning_rate": 6.612432797847937e-06, "epoch": 2.296751873918893, "percentage": 76.56, "elapsed_time": "5:24:58", "remaining_time": "1:39:30", "throughput": 30123.78, "total_tokens": 587366400} {"current_steps": 71800, "total_steps": 93654, "loss": 0.7922, "learning_rate": 6.55510726083873e-06, "epoch": 2.2999551540777756, "percentage": 76.67, "elapsed_time": "5:32:45", "remaining_time": "1:41:16", "throughput": 29460.08, "total_tokens": 588185600} {"current_steps": 71900, "total_steps": 93654, "loss": 0.7617, "learning_rate": 6.4979937781459586e-06, "epoch": 2.3031584342366584, "percentage": 76.77, "elapsed_time": "5:40:31", "remaining_time": "1:43:01", "throughput": 28828.73, "total_tokens": 589004800} {"current_steps": 72000, "total_steps": 93654, "loss": 0.8744, "learning_rate": 6.441093006382831e-06, "epoch": 2.306361714395541, "percentage": 76.88, "elapsed_time": "5:48:22", "remaining_time": "1:44:46", "throughput": 28217.63, "total_tokens": 589824000} {"current_steps": 72100, "total_steps": 93654, "loss": 0.7952, "learning_rate": 6.384405599717125e-06, "epoch": 2.3095649945544237, "percentage": 76.99, "elapsed_time": "5:56:09", "remaining_time": "1:46:28", "throughput": 27639.48, "total_tokens": 590643200} {"current_steps": 72200, "total_steps": 93654, "loss": 0.817, "learning_rate": 6.327932209863618e-06, "epoch": 2.3127682747133065, "percentage": 77.09, "elapsed_time": "6:03:54", "remaining_time": "1:48:08", "throughput": 27088.25, "total_tokens": 591462400} {"current_steps": 72300, "total_steps": 93654, "loss": 0.8127, "learning_rate": 6.271673486076629e-06, "epoch": 2.3159715548721893, "percentage": 77.2, "elapsed_time": "6:11:41", "remaining_time": "1:49:46", "throughput": 26557.63, "total_tokens": 592281600} {"current_steps": 72400, "total_steps": 93654, "loss": 0.8191, "learning_rate": 6.215630075142523e-06, "epoch": 2.3191748350310717, "percentage": 77.31, "elapsed_time": "6:19:27", "remaining_time": "1:51:23", "throughput": 26049.8, "total_tokens": 593100800} {"current_steps": 72500, "total_steps": 93654, "loss": 0.831, "learning_rate": 6.159802621372279e-06, "epoch": 2.3223781151899545, "percentage": 77.41, "elapsed_time": "6:27:14", "remaining_time": "1:52:59", "throughput": 25562.52, "total_tokens": 593920000} {"current_steps": 72600, "total_steps": 93654, "loss": 0.8249, "learning_rate": 6.1041917665941275e-06, "epoch": 2.3255813953488373, "percentage": 77.52, "elapsed_time": "6:35:01", "remaining_time": "1:54:33", "throughput": 25093.29, "total_tokens": 594739200} {"current_steps": 72700, "total_steps": 93654, "loss": 0.7416, "learning_rate": 6.048798150146112e-06, "epoch": 2.3287846755077197, "percentage": 77.63, "elapsed_time": "6:42:45", "remaining_time": "1:56:05", "throughput": 24644.6, "total_tokens": 595558400} {"current_steps": 72800, "total_steps": 93654, "loss": 0.8451, "learning_rate": 5.993622408868788e-06, "epoch": 2.3319879556666026, "percentage": 77.73, "elapsed_time": "6:50:33", "remaining_time": "1:57:36", "throughput": 24210.19, "total_tokens": 596377600} {"current_steps": 72900, "total_steps": 93654, "loss": 0.8654, "learning_rate": 5.9386651770978516e-06, "epoch": 2.3351912358254854, "percentage": 77.84, "elapsed_time": "6:58:20", "remaining_time": "1:59:05", "throughput": 23791.88, "total_tokens": 597196800} {"current_steps": 73000, "total_steps": 93654, "loss": 0.8397, "learning_rate": 5.8839270866568816e-06, "epoch": 2.338394515984368, "percentage": 77.95, "elapsed_time": "7:06:08", "remaining_time": "2:00:34", "throughput": 23388.41, "total_tokens": 598016000} {"current_steps": 73100, "total_steps": 93654, "loss": 0.833, "learning_rate": 5.829408766850078e-06, "epoch": 2.3415977961432506, "percentage": 78.05, "elapsed_time": "7:14:07", "remaining_time": "2:02:03", "throughput": 22989.95, "total_tokens": 598835200} {"current_steps": 73200, "total_steps": 93654, "loss": 0.8174, "learning_rate": 5.7751108444550066e-06, "epoch": 2.3448010763021334, "percentage": 78.16, "elapsed_time": "7:21:55", "remaining_time": "2:03:29", "throughput": 22615.03, "total_tokens": 599654400} {"current_steps": 73300, "total_steps": 93654, "loss": 0.7809, "learning_rate": 5.7210339437154175e-06, "epoch": 2.3480043564610162, "percentage": 78.27, "elapsed_time": "7:29:43", "remaining_time": "2:04:52", "throughput": 22253.77, "total_tokens": 600473600} {"current_steps": 73400, "total_steps": 93654, "loss": 0.8243, "learning_rate": 5.667178686334037e-06, "epoch": 2.3512076366198986, "percentage": 78.37, "elapsed_time": "7:37:30", "remaining_time": "2:06:14", "throughput": 21904.53, "total_tokens": 601292800} {"current_steps": 73500, "total_steps": 93654, "loss": 0.7868, "learning_rate": 5.613545691465438e-06, "epoch": 2.3544109167787814, "percentage": 78.48, "elapsed_time": "7:45:17", "remaining_time": "2:07:35", "throughput": 21567.23, "total_tokens": 602112000} {"current_steps": 73600, "total_steps": 93654, "loss": 0.8176, "learning_rate": 5.560135575708927e-06, "epoch": 2.3576141969376643, "percentage": 78.59, "elapsed_time": "7:53:05", "remaining_time": "2:08:54", "throughput": 21240.6, "total_tokens": 602931200} {"current_steps": 73700, "total_steps": 93654, "loss": 0.8417, "learning_rate": 5.506948953101454e-06, "epoch": 2.360817477096547, "percentage": 78.69, "elapsed_time": "8:00:52", "remaining_time": "2:10:11", "throughput": 20925.4, "total_tokens": 603750400} {"current_steps": 73800, "total_steps": 93654, "loss": 0.8552, "learning_rate": 5.45398643511055e-06, "epoch": 2.3640207572554295, "percentage": 78.8, "elapsed_time": "8:08:39", "remaining_time": "2:11:27", "throughput": 20620.3, "total_tokens": 604569600} {"current_steps": 73900, "total_steps": 93654, "loss": 0.8423, "learning_rate": 5.401248630627282e-06, "epoch": 2.3672240374143123, "percentage": 78.91, "elapsed_time": "8:16:25", "remaining_time": "2:12:41", "throughput": 20325.04, "total_tokens": 605388800} {"current_steps": 74000, "total_steps": 93654, "loss": 0.8278, "learning_rate": 5.3487361459592626e-06, "epoch": 2.370427317573195, "percentage": 79.01, "elapsed_time": "8:24:10", "remaining_time": "2:13:54", "throughput": 20039.72, "total_tokens": 606208000} {"current_steps": 74100, "total_steps": 93654, "loss": 0.8354, "learning_rate": 5.296449584823707e-06, "epoch": 2.3736305977320775, "percentage": 79.12, "elapsed_time": "8:32:10", "remaining_time": "2:15:09", "throughput": 19752.97, "total_tokens": 607027200} {"current_steps": 74200, "total_steps": 93654, "loss": 0.8292, "learning_rate": 5.244389548340456e-06, "epoch": 2.3768338778909603, "percentage": 79.23, "elapsed_time": "8:39:57", "remaining_time": "2:16:19", "throughput": 19483.85, "total_tokens": 607846400} {"current_steps": 74300, "total_steps": 93654, "loss": 0.8604, "learning_rate": 5.19255663502507e-06, "epoch": 2.380037158049843, "percentage": 79.33, "elapsed_time": "8:47:47", "remaining_time": "2:17:28", "throughput": 19220.61, "total_tokens": 608665600} {"current_steps": 74400, "total_steps": 93654, "loss": 0.8464, "learning_rate": 5.1409514407819745e-06, "epoch": 2.3832404382087256, "percentage": 79.44, "elapsed_time": "8:55:36", "remaining_time": "2:18:36", "throughput": 18965.76, "total_tokens": 609484800} {"current_steps": 74500, "total_steps": 93654, "loss": 0.8711, "learning_rate": 5.089574558897564e-06, "epoch": 2.3864437183676084, "percentage": 79.55, "elapsed_time": "9:03:23", "remaining_time": "2:19:42", "throughput": 18718.99, "total_tokens": 610304000} {"current_steps": 74600, "total_steps": 93654, "loss": 0.8357, "learning_rate": 5.038426580033431e-06, "epoch": 2.389646998526491, "percentage": 79.65, "elapsed_time": "9:11:11", "remaining_time": "2:20:46", "throughput": 18479.0, "total_tokens": 611123200} {"current_steps": 74700, "total_steps": 93654, "loss": 0.8782, "learning_rate": 4.98750809221955e-06, "epoch": 2.3928502786853736, "percentage": 79.76, "elapsed_time": "9:18:59", "remaining_time": "2:21:50", "throughput": 18245.34, "total_tokens": 611942400} {"current_steps": 74800, "total_steps": 93654, "loss": 0.8051, "learning_rate": 4.936819680847499e-06, "epoch": 2.3960535588442564, "percentage": 79.87, "elapsed_time": "9:26:45", "remaining_time": "2:22:51", "throughput": 18019.58, "total_tokens": 612761600} {"current_steps": 74900, "total_steps": 93654, "loss": 0.8208, "learning_rate": 4.886361928663779e-06, "epoch": 2.3992568390031392, "percentage": 79.98, "elapsed_time": "9:34:32", "remaining_time": "2:23:51", "throughput": 17799.22, "total_tokens": 613580800} {"current_steps": 75000, "total_steps": 93654, "loss": 0.8081, "learning_rate": 4.836135415763054e-06, "epoch": 2.402460119162022, "percentage": 80.08, "elapsed_time": "9:42:18", "remaining_time": "2:24:49", "throughput": 17585.02, "total_tokens": 614400000} {"current_steps": 75100, "total_steps": 93654, "loss": 0.8612, "learning_rate": 4.786140719581539e-06, "epoch": 2.4056633993209044, "percentage": 80.19, "elapsed_time": "9:50:20", "remaining_time": "2:25:50", "throughput": 17369.2, "total_tokens": 615219200} {"current_steps": 75200, "total_steps": 93654, "loss": 0.8201, "learning_rate": 4.73637841489033e-06, "epoch": 2.4088666794797873, "percentage": 80.3, "elapsed_time": "9:58:06", "remaining_time": "2:26:46", "throughput": 17166.24, "total_tokens": 616038400} {"current_steps": 75300, "total_steps": 93654, "loss": 0.8319, "learning_rate": 4.686849073788782e-06, "epoch": 2.41206995963867, "percentage": 80.4, "elapsed_time": "10:05:54", "remaining_time": "2:27:41", "throughput": 16967.72, "total_tokens": 616857600} {"current_steps": 75400, "total_steps": 93654, "loss": 0.8012, "learning_rate": 4.637553265697978e-06, "epoch": 2.4152732397975525, "percentage": 80.51, "elapsed_time": "10:13:41", "remaining_time": "2:28:34", "throughput": 16774.86, "total_tokens": 617676800} {"current_steps": 75500, "total_steps": 93654, "loss": 0.8216, "learning_rate": 4.5884915573541326e-06, "epoch": 2.4184765199564353, "percentage": 80.62, "elapsed_time": "10:21:28", "remaining_time": "2:29:25", "throughput": 16586.84, "total_tokens": 618496000} {"current_steps": 75600, "total_steps": 93654, "loss": 0.8269, "learning_rate": 4.539664512802125e-06, "epoch": 2.421679800115318, "percentage": 80.72, "elapsed_time": "10:29:15", "remaining_time": "2:30:16", "throughput": 16403.53, "total_tokens": 619315200} {"current_steps": 75700, "total_steps": 93654, "loss": 0.7949, "learning_rate": 4.491072693388957e-06, "epoch": 2.424883080274201, "percentage": 80.83, "elapsed_time": "10:37:00", "remaining_time": "2:31:04", "throughput": 16225.04, "total_tokens": 620134400} {"current_steps": 75800, "total_steps": 93654, "loss": 0.8153, "learning_rate": 4.442716657757354e-06, "epoch": 2.4280863604330833, "percentage": 80.94, "elapsed_time": "10:44:47", "remaining_time": "2:31:52", "throughput": 16050.37, "total_tokens": 620953600} {"current_steps": 75900, "total_steps": 93654, "loss": 0.8063, "learning_rate": 4.3945969618393255e-06, "epoch": 2.431289640591966, "percentage": 81.04, "elapsed_time": "10:52:34", "remaining_time": "2:32:38", "throughput": 15880.14, "total_tokens": 621772800} {"current_steps": 76000, "total_steps": 93654, "loss": 0.7779, "learning_rate": 4.346714158849744e-06, "epoch": 2.434492920750849, "percentage": 81.15, "elapsed_time": "11:00:22", "remaining_time": "2:33:23", "throughput": 15713.1, "total_tokens": 622592000} {"current_steps": 76100, "total_steps": 93654, "loss": 0.8322, "learning_rate": 4.299068799280032e-06, "epoch": 2.4376962009097314, "percentage": 81.26, "elapsed_time": "11:08:17", "remaining_time": "2:34:09", "throughput": 15547.46, "total_tokens": 623411200} {"current_steps": 76200, "total_steps": 93654, "loss": 0.8294, "learning_rate": 4.251661430891787e-06, "epoch": 2.440899481068614, "percentage": 81.36, "elapsed_time": "11:16:05", "remaining_time": "2:34:51", "throughput": 15388.18, "total_tokens": 624230400} {"current_steps": 76300, "total_steps": 93654, "loss": 0.819, "learning_rate": 4.20449259871053e-06, "epoch": 2.444102761227497, "percentage": 81.47, "elapsed_time": "11:23:50", "remaining_time": "2:35:32", "throughput": 15233.71, "total_tokens": 625049600} {"current_steps": 76400, "total_steps": 93654, "loss": 0.7969, "learning_rate": 4.157562845019405e-06, "epoch": 2.44730604138638, "percentage": 81.58, "elapsed_time": "11:31:37", "remaining_time": "2:36:11", "throughput": 15082.08, "total_tokens": 625868800} {"current_steps": 76500, "total_steps": 93654, "loss": 0.8516, "learning_rate": 4.1108727093529644e-06, "epoch": 2.4505093215452622, "percentage": 81.68, "elapsed_time": "11:39:24", "remaining_time": "2:36:49", "throughput": 14933.68, "total_tokens": 626688000} {"current_steps": 76600, "total_steps": 93654, "loss": 0.8471, "learning_rate": 4.064422728490946e-06, "epoch": 2.453712601704145, "percentage": 81.79, "elapsed_time": "11:47:12", "remaining_time": "2:37:27", "throughput": 14788.23, "total_tokens": 627507200} {"current_steps": 76700, "total_steps": 93654, "loss": 0.84, "learning_rate": 4.018213436452117e-06, "epoch": 2.456915881863028, "percentage": 81.9, "elapsed_time": "11:55:02", "remaining_time": "2:38:03", "throughput": 14645.39, "total_tokens": 628326400} {"current_steps": 76800, "total_steps": 93654, "loss": 0.8224, "learning_rate": 3.972245364488136e-06, "epoch": 2.4601191620219103, "percentage": 82.0, "elapsed_time": "12:02:49", "remaining_time": "2:38:37", "throughput": 14506.77, "total_tokens": 629145600} {"current_steps": 76900, "total_steps": 93654, "loss": 0.8476, "learning_rate": 3.926519041077445e-06, "epoch": 2.463322442180793, "percentage": 82.11, "elapsed_time": "12:10:36", "remaining_time": "2:39:10", "throughput": 14370.77, "total_tokens": 629964800} {"current_steps": 77000, "total_steps": 93654, "loss": 0.8256, "learning_rate": 3.8810349919191825e-06, "epoch": 2.466525722339676, "percentage": 82.22, "elapsed_time": "12:18:24", "remaining_time": "2:39:42", "throughput": 14237.6, "total_tokens": 630784000} {"current_steps": 77100, "total_steps": 93654, "loss": 0.8494, "learning_rate": 3.835793739927151e-06, "epoch": 2.4697290024985588, "percentage": 82.32, "elapsed_time": "12:26:12", "remaining_time": "2:40:13", "throughput": 14106.93, "total_tokens": 631603200} {"current_steps": 77100, "total_steps": 93654, "loss": 0.8493, "learning_rate": 3.835793739927151e-06, "epoch": 2.4697290024985588, "percentage": 82.32, "elapsed_time": "0:08:00", "remaining_time": "0:01:43", "throughput": 1315043.39, "total_tokens": 631603200} {"current_steps": 77200, "total_steps": 93654, "loss": 0.8275, "learning_rate": 3.7907958052237875e-06, "epoch": 2.472932282657441, "percentage": 82.43, "elapsed_time": "0:15:48", "remaining_time": "0:03:22", "throughput": 666880.7, "total_tokens": 632422400} {"current_steps": 77300, "total_steps": 93654, "loss": 0.8628, "learning_rate": 3.746041705134215e-06, "epoch": 2.476135562816324, "percentage": 82.54, "elapsed_time": "0:23:38", "remaining_time": "0:05:00", "throughput": 446390.36, "total_tokens": 633241600} {"current_steps": 77400, "total_steps": 93654, "loss": 0.8246, "learning_rate": 3.7015319541802708e-06, "epoch": 2.479338842975207, "percentage": 82.64, "elapsed_time": "0:31:26", "remaining_time": "0:06:36", "throughput": 336158.63, "total_tokens": 634060800} {"current_steps": 77500, "total_steps": 93654, "loss": 0.806, "learning_rate": 3.657267064074607e-06, "epoch": 2.482542123134089, "percentage": 82.75, "elapsed_time": "0:39:30", "remaining_time": "0:08:14", "throughput": 267831.46, "total_tokens": 634880000} {"current_steps": 77600, "total_steps": 93654, "loss": 0.8068, "learning_rate": 3.613247543714779e-06, "epoch": 2.485745403292972, "percentage": 82.86, "elapsed_time": "0:47:36", "remaining_time": "0:09:50", "throughput": 222544.85, "total_tokens": 635699200} {"current_steps": 77700, "total_steps": 93654, "loss": 0.7704, "learning_rate": 3.5694738991774197e-06, "epoch": 2.488948683451855, "percentage": 82.96, "elapsed_time": "0:55:42", "remaining_time": "0:11:26", "throughput": 190459.51, "total_tokens": 636518400} {"current_steps": 77800, "total_steps": 93654, "loss": 0.8625, "learning_rate": 3.5259466337124293e-06, "epoch": 2.492151963610737, "percentage": 83.07, "elapsed_time": "1:03:53", "remaining_time": "0:13:01", "throughput": 166250.66, "total_tokens": 637337600} {"current_steps": 77900, "total_steps": 93654, "loss": 0.8093, "learning_rate": 3.4826662477371624e-06, "epoch": 2.49535524376962, "percentage": 83.18, "elapsed_time": "1:11:59", "remaining_time": "0:14:33", "throughput": 147747.02, "total_tokens": 638156800} {"current_steps": 78000, "total_steps": 93654, "loss": 0.8533, "learning_rate": 3.4396332388307057e-06, "epoch": 2.498558523928503, "percentage": 83.29, "elapsed_time": "1:20:07", "remaining_time": "0:16:04", "throughput": 132918.45, "total_tokens": 638976000} {"current_steps": 78100, "total_steps": 93654, "loss": 0.8254, "learning_rate": 3.3968481017281173e-06, "epoch": 2.5017618040873852, "percentage": 83.39, "elapsed_time": "1:28:15", "remaining_time": "0:17:34", "throughput": 120814.18, "total_tokens": 639795200} {"current_steps": 78200, "total_steps": 93654, "loss": 0.8311, "learning_rate": 3.3543113283147687e-06, "epoch": 2.504965084246268, "percentage": 83.5, "elapsed_time": "1:36:22", "remaining_time": "0:19:02", "throughput": 110785.38, "total_tokens": 640614400} {"current_steps": 78300, "total_steps": 93654, "loss": 0.8285, "learning_rate": 3.3120234076206987e-06, "epoch": 2.508168364405151, "percentage": 83.61, "elapsed_time": "1:44:40", "remaining_time": "0:20:31", "throughput": 102129.95, "total_tokens": 641433600} {"current_steps": 78400, "total_steps": 93654, "loss": 0.8276, "learning_rate": 3.2699848258149617e-06, "epoch": 2.5113716445640337, "percentage": 83.71, "elapsed_time": "1:53:07", "remaining_time": "0:22:00", "throughput": 94623.21, "total_tokens": 642252800} {"current_steps": 78500, "total_steps": 93654, "loss": 0.7989, "learning_rate": 3.228196066200051e-06, "epoch": 2.514574924722916, "percentage": 83.82, "elapsed_time": "2:01:36", "remaining_time": "0:23:28", "throughput": 88131.05, "total_tokens": 643072000} {"current_steps": 78600, "total_steps": 93654, "loss": 0.8165, "learning_rate": 3.186657609206353e-06, "epoch": 2.517778204881799, "percentage": 83.93, "elapsed_time": "2:10:04", "remaining_time": "0:24:54", "throughput": 82500.17, "total_tokens": 643891200} {"current_steps": 78700, "total_steps": 93654, "loss": 0.8476, "learning_rate": 3.1453699323866047e-06, "epoch": 2.5209814850406818, "percentage": 84.03, "elapsed_time": "2:18:35", "remaining_time": "0:26:20", "throughput": 77529.64, "total_tokens": 644710400} {"current_steps": 78800, "total_steps": 93654, "loss": 0.8386, "learning_rate": 3.1043335104104233e-06, "epoch": 2.524184765199564, "percentage": 84.14, "elapsed_time": "2:28:56", "remaining_time": "0:28:04", "throughput": 72237.66, "total_tokens": 645529600} {"current_steps": 78900, "total_steps": 93654, "loss": 0.8198, "learning_rate": 3.0635488150588338e-06, "epoch": 2.527388045358447, "percentage": 84.25, "elapsed_time": "2:38:16", "remaining_time": "0:29:35", "throughput": 68064.98, "total_tokens": 646348800} {"current_steps": 79000, "total_steps": 93654, "loss": 0.8364, "learning_rate": 3.0230163152188463e-06, "epoch": 2.53059132551733, "percentage": 84.35, "elapsed_time": "2:49:19", "remaining_time": "0:31:24", "throughput": 63699.55, "total_tokens": 647168000} {"current_steps": 79100, "total_steps": 93654, "loss": 0.7922, "learning_rate": 2.9827364768780814e-06, "epoch": 2.5337946056762126, "percentage": 84.46, "elapsed_time": "2:59:57", "remaining_time": "0:33:06", "throughput": 60009.96, "total_tokens": 647987200} {"current_steps": 79200, "total_steps": 93654, "loss": 0.7829, "learning_rate": 2.942709763119386e-06, "epoch": 2.536997885835095, "percentage": 84.57, "elapsed_time": "3:11:04", "remaining_time": "0:34:52", "throughput": 56594.77, "total_tokens": 648806400} {"current_steps": 79300, "total_steps": 93654, "loss": 0.8196, "learning_rate": 2.9029366341155356e-06, "epoch": 2.540201165993978, "percentage": 84.67, "elapsed_time": "3:22:21", "remaining_time": "0:36:37", "throughput": 53503.93, "total_tokens": 649625600} {"current_steps": 79400, "total_steps": 93654, "loss": 0.788, "learning_rate": 2.863417547123934e-06, "epoch": 2.5434044461528607, "percentage": 84.78, "elapsed_time": "3:33:29", "remaining_time": "0:38:19", "throughput": 50777.05, "total_tokens": 650444800} {"current_steps": 79500, "total_steps": 93654, "loss": 0.8414, "learning_rate": 2.8241529564813434e-06, "epoch": 2.546607726311743, "percentage": 84.89, "elapsed_time": "3:44:39", "remaining_time": "0:39:59", "throughput": 48313.48, "total_tokens": 651264000} {"current_steps": 79600, "total_steps": 93654, "loss": 0.851, "learning_rate": 2.7851433135986843e-06, "epoch": 2.549811006470626, "percentage": 84.99, "elapsed_time": "3:54:04", "remaining_time": "0:41:19", "throughput": 46429.68, "total_tokens": 652083200} {"current_steps": 79700, "total_steps": 93654, "loss": 0.8379, "learning_rate": 2.7463890669558263e-06, "epoch": 2.5530142866295087, "percentage": 85.1, "elapsed_time": "4:02:45", "remaining_time": "0:42:30", "throughput": 44826.15, "total_tokens": 652902400} {"current_steps": 79800, "total_steps": 93654, "loss": 0.7906, "learning_rate": 2.707890662096452e-06, "epoch": 2.5562175667883915, "percentage": 85.21, "elapsed_time": "4:11:32", "remaining_time": "0:43:40", "throughput": 43315.54, "total_tokens": 653721600} {"current_steps": 79900, "total_steps": 93654, "loss": 0.8011, "learning_rate": 2.6696485416228987e-06, "epoch": 2.559420846947274, "percentage": 85.31, "elapsed_time": "4:20:09", "remaining_time": "0:44:46", "throughput": 41933.06, "total_tokens": 654540800} {"current_steps": 79100, "total_steps": 93654, "loss": 0.7922, "learning_rate": 2.9827364768780814e-06, "epoch": 2.5337946056762126, "percentage": 84.46, "elapsed_time": "0:08:27", "remaining_time": "0:01:33", "throughput": 1277675.65, "total_tokens": 647987200} {"current_steps": 79200, "total_steps": 93654, "loss": 0.7829, "learning_rate": 2.942709763119386e-06, "epoch": 2.536997885835095, "percentage": 84.57, "elapsed_time": "0:17:24", "remaining_time": "0:03:10", "throughput": 621305.09, "total_tokens": 648806400} {"current_steps": 79300, "total_steps": 93654, "loss": 0.8196, "learning_rate": 2.9029366341155356e-06, "epoch": 2.540201165993978, "percentage": 84.67, "elapsed_time": "0:26:02", "remaining_time": "0:04:42", "throughput": 415733.18, "total_tokens": 649625600} {"current_steps": 79400, "total_steps": 93654, "loss": 0.788, "learning_rate": 2.863417547123934e-06, "epoch": 2.5434044461528607, "percentage": 84.78, "elapsed_time": "0:34:26", "remaining_time": "0:06:10", "throughput": 314780.78, "total_tokens": 650444800} {"current_steps": 79500, "total_steps": 93654, "loss": 0.8413, "learning_rate": 2.8241529564813434e-06, "epoch": 2.546607726311743, "percentage": 84.89, "elapsed_time": "0:43:09", "remaining_time": "0:07:41", "throughput": 251507.63, "total_tokens": 651264000} {"current_steps": 79600, "total_steps": 93654, "loss": 0.851, "learning_rate": 2.7851433135986843e-06, "epoch": 2.549811006470626, "percentage": 84.99, "elapsed_time": "0:51:38", "remaining_time": "0:09:07", "throughput": 210434.2, "total_tokens": 652083200} {"current_steps": 79700, "total_steps": 93654, "loss": 0.8379, "learning_rate": 2.7463890669558263e-06, "epoch": 2.5530142866295087, "percentage": 85.1, "elapsed_time": "0:59:51", "remaining_time": "0:10:28", "throughput": 181779.02, "total_tokens": 652902400} {"current_steps": 79800, "total_steps": 93654, "loss": 0.7906, "learning_rate": 2.707890662096452e-06, "epoch": 2.5562175667883915, "percentage": 85.21, "elapsed_time": "1:07:31", "remaining_time": "0:11:43", "throughput": 161356.22, "total_tokens": 653721600} {"current_steps": 79900, "total_steps": 93654, "loss": 0.8011, "learning_rate": 2.6696485416228987e-06, "epoch": 2.559420846947274, "percentage": 85.31, "elapsed_time": "1:15:09", "remaining_time": "0:12:56", "throughput": 145146.48, "total_tokens": 654540800} {"current_steps": 80000, "total_steps": 93654, "loss": 0.8328, "learning_rate": 2.6316631451911213e-06, "epoch": 2.5626241271061567, "percentage": 85.42, "elapsed_time": "1:22:48", "remaining_time": "0:14:07", "throughput": 131904.96, "total_tokens": 655360000} {"current_steps": 80100, "total_steps": 93654, "loss": 0.8896, "learning_rate": 2.593934909505602e-06, "epoch": 2.5658274072650396, "percentage": 85.53, "elapsed_time": "1:30:31", "remaining_time": "0:15:19", "throughput": 120809.53, "total_tokens": 656179200} {"current_steps": 80200, "total_steps": 93654, "loss": 0.8405, "learning_rate": 2.5564642683143263e-06, "epoch": 2.569030687423922, "percentage": 85.63, "elapsed_time": "1:38:33", "remaining_time": "0:16:32", "throughput": 111099.78, "total_tokens": 656998400} {"current_steps": 80300, "total_steps": 93654, "loss": 0.8639, "learning_rate": 2.51925165240382e-06, "epoch": 2.5722339675828048, "percentage": 85.74, "elapsed_time": "1:46:45", "remaining_time": "0:17:45", "throughput": 102697.89, "total_tokens": 657817600} {"current_steps": 80400, "total_steps": 93654, "loss": 0.813, "learning_rate": 2.482297489594182e-06, "epoch": 2.5754372477416876, "percentage": 85.85, "elapsed_time": "1:54:55", "remaining_time": "0:18:56", "throughput": 95516.09, "total_tokens": 658636800} {"current_steps": 80500, "total_steps": 93654, "loss": 0.8494, "learning_rate": 2.4456022047341653e-06, "epoch": 2.5786405279005704, "percentage": 85.95, "elapsed_time": "2:03:05", "remaining_time": "0:20:06", "throughput": 89291.58, "total_tokens": 659456000} {"current_steps": 80600, "total_steps": 93654, "loss": 0.8748, "learning_rate": 2.4091662196963014e-06, "epoch": 2.581843808059453, "percentage": 86.06, "elapsed_time": "2:10:46", "remaining_time": "0:21:10", "throughput": 84148.87, "total_tokens": 660275200} {"current_steps": 80700, "total_steps": 93654, "loss": 0.8254, "learning_rate": 2.3729899533720485e-06, "epoch": 2.5850470882183356, "percentage": 86.17, "elapsed_time": "2:18:22", "remaining_time": "0:22:12", "throughput": 79622.35, "total_tokens": 661094400} {"current_steps": 80800, "total_steps": 93654, "loss": 0.8373, "learning_rate": 2.3370738216669574e-06, "epoch": 2.588250368377218, "percentage": 86.28, "elapsed_time": "2:26:02", "remaining_time": "0:23:13", "throughput": 75542.84, "total_tokens": 661913600} {"current_steps": 80900, "total_steps": 93654, "loss": 0.7675, "learning_rate": 2.3014182374959116e-06, "epoch": 2.591453648536101, "percentage": 86.38, "elapsed_time": "2:33:38", "remaining_time": "0:24:13", "throughput": 71893.6, "total_tokens": 662732800} {"current_steps": 81000, "total_steps": 93654, "loss": 0.8264, "learning_rate": 2.2660236107783783e-06, "epoch": 2.5946569286949837, "percentage": 86.49, "elapsed_time": "2:41:15", "remaining_time": "0:25:11", "throughput": 68579.72, "total_tokens": 663552000} {"current_steps": 81100, "total_steps": 93654, "loss": 0.8579, "learning_rate": 2.230890348433684e-06, "epoch": 2.5978602088538665, "percentage": 86.6, "elapsed_time": "2:48:56", "remaining_time": "0:26:09", "throughput": 65544.03, "total_tokens": 664371200} {"current_steps": 81200, "total_steps": 93654, "loss": 0.8412, "learning_rate": 2.1960188543763526e-06, "epoch": 2.6010634890127493, "percentage": 86.7, "elapsed_time": "2:56:33", "remaining_time": "0:27:04", "throughput": 62794.23, "total_tokens": 665190400} {"current_steps": 81300, "total_steps": 93654, "loss": 0.7985, "learning_rate": 2.161409529511438e-06, "epoch": 2.6042667691716317, "percentage": 86.81, "elapsed_time": "3:04:08", "remaining_time": "0:27:58", "throughput": 60281.51, "total_tokens": 666009600} {"current_steps": 81400, "total_steps": 93654, "loss": 0.8033, "learning_rate": 2.127062771729929e-06, "epoch": 2.6074700493305145, "percentage": 86.92, "elapsed_time": "3:11:44", "remaining_time": "0:28:51", "throughput": 57964.89, "total_tokens": 666828800} {"current_steps": 81500, "total_steps": 93654, "loss": 0.8538, "learning_rate": 2.092978975904189e-06, "epoch": 2.610673329489397, "percentage": 87.02, "elapsed_time": "3:19:22", "remaining_time": "0:29:44", "throughput": 55809.6, "total_tokens": 667648000} {"current_steps": 81600, "total_steps": 93654, "loss": 0.8805, "learning_rate": 2.059158533883393e-06, "epoch": 2.6138766096482797, "percentage": 87.13, "elapsed_time": "3:27:00", "remaining_time": "0:30:34", "throughput": 53820.37, "total_tokens": 668467200} {"current_steps": 81700, "total_steps": 93654, "loss": 0.8837, "learning_rate": 2.025601834489038e-06, "epoch": 2.6170798898071626, "percentage": 87.24, "elapsed_time": "3:34:55", "remaining_time": "0:31:26", "throughput": 51901.35, "total_tokens": 669286400} {"current_steps": 81800, "total_steps": 93654, "loss": 0.7892, "learning_rate": 1.9923092635104557e-06, "epoch": 2.6202831699660454, "percentage": 87.34, "elapsed_time": "3:42:33", "remaining_time": "0:32:15", "throughput": 50180.49, "total_tokens": 670105600} {"current_steps": 81900, "total_steps": 93654, "loss": 0.774, "learning_rate": 1.9592812037003918e-06, "epoch": 2.6234864501249278, "percentage": 87.45, "elapsed_time": "3:50:09", "remaining_time": "0:33:01", "throughput": 48584.35, "total_tokens": 670924800} {"current_steps": 82000, "total_steps": 93654, "loss": 0.8393, "learning_rate": 1.9265180347706053e-06, "epoch": 2.6266897302838106, "percentage": 87.56, "elapsed_time": "3:57:48", "remaining_time": "0:33:47", "throughput": 47078.61, "total_tokens": 671744000} {"current_steps": 82100, "total_steps": 93654, "loss": 0.8398, "learning_rate": 1.894020133387503e-06, "epoch": 2.6298930104426934, "percentage": 87.66, "elapsed_time": "4:05:49", "remaining_time": "0:34:35", "throughput": 45599.35, "total_tokens": 672563200} {"current_steps": 82200, "total_steps": 93654, "loss": 0.8031, "learning_rate": 1.8617878731678e-06, "epoch": 2.633096290601576, "percentage": 87.77, "elapsed_time": "4:13:54", "remaining_time": "0:35:22", "throughput": 44202.2, "total_tokens": 673382400} {"current_steps": 82300, "total_steps": 93654, "loss": 0.831, "learning_rate": 1.8298216246742329e-06, "epoch": 2.6362995707604586, "percentage": 87.88, "elapsed_time": "4:21:58", "remaining_time": "0:36:08", "throughput": 42890.93, "total_tokens": 674201600} {"current_steps": 82400, "total_steps": 93654, "loss": 0.8778, "learning_rate": 1.798121755411289e-06, "epoch": 2.6395028509193414, "percentage": 87.98, "elapsed_time": "4:30:11", "remaining_time": "0:36:54", "throughput": 41638.13, "total_tokens": 675020800} {"current_steps": 82500, "total_steps": 93654, "loss": 0.7904, "learning_rate": 1.7666886298210006e-06, "epoch": 2.6427061310782243, "percentage": 88.09, "elapsed_time": "4:38:21", "remaining_time": "0:37:38", "throughput": 40464.82, "total_tokens": 675840000} {"current_steps": 82600, "total_steps": 93654, "loss": 0.8547, "learning_rate": 1.735522609278742e-06, "epoch": 2.6459094112371067, "percentage": 88.2, "elapsed_time": "4:46:33", "remaining_time": "0:38:20", "throughput": 39355.9, "total_tokens": 676659200} {"current_steps": 82700, "total_steps": 93654, "loss": 0.8395, "learning_rate": 1.7046240520890655e-06, "epoch": 2.6491126913959895, "percentage": 88.3, "elapsed_time": "4:54:35", "remaining_time": "0:39:01", "throughput": 38328.85, "total_tokens": 677478400} {"current_steps": 82800, "total_steps": 93654, "loss": 0.8106, "learning_rate": 1.6739933134816117e-06, "epoch": 2.6523159715548723, "percentage": 88.41, "elapsed_time": "5:02:26", "remaining_time": "0:39:38", "throughput": 37378.6, "total_tokens": 678297600} {"current_steps": 82900, "total_steps": 93654, "loss": 0.8427, "learning_rate": 1.6436307456069832e-06, "epoch": 2.6555192517137547, "percentage": 88.52, "elapsed_time": "5:10:59", "remaining_time": "0:40:20", "throughput": 36395.65, "total_tokens": 679116800} {"current_steps": 83000, "total_steps": 93654, "loss": 0.8306, "learning_rate": 1.6135366975327442e-06, "epoch": 2.6587225318726375, "percentage": 88.62, "elapsed_time": "5:19:45", "remaining_time": "0:41:02", "throughput": 35439.56, "total_tokens": 679936000} {"current_steps": 83100, "total_steps": 93654, "loss": 0.8785, "learning_rate": 1.5837115152393695e-06, "epoch": 2.6619258120315203, "percentage": 88.73, "elapsed_time": "5:27:45", "remaining_time": "0:41:37", "throughput": 34617.13, "total_tokens": 680755200} {"current_steps": 83200, "total_steps": 93654, "loss": 0.7719, "learning_rate": 1.5541555416162784e-06, "epoch": 2.665129092190403, "percentage": 88.84, "elapsed_time": "5:36:00", "remaining_time": "0:42:13", "throughput": 33806.97, "total_tokens": 681574400} {"current_steps": 83300, "total_steps": 93654, "loss": 0.7945, "learning_rate": 1.5248691164579054e-06, "epoch": 2.6683323723492856, "percentage": 88.94, "elapsed_time": "5:43:55", "remaining_time": "0:42:44", "throughput": 33069.23, "total_tokens": 682393600} {"current_steps": 83400, "total_steps": 93654, "loss": 0.8751, "learning_rate": 1.4958525764597719e-06, "epoch": 2.6715356525081684, "percentage": 89.05, "elapsed_time": "5:51:40", "remaining_time": "0:43:14", "throughput": 32378.73, "total_tokens": 683212800} {"current_steps": 83500, "total_steps": 93654, "loss": 0.807, "learning_rate": 1.4671062552146342e-06, "epoch": 2.674738932667051, "percentage": 89.16, "elapsed_time": "5:59:29", "remaining_time": "0:43:42", "throughput": 31713.08, "total_tokens": 684032000} {"current_steps": 83600, "total_steps": 93654, "loss": 0.8519, "learning_rate": 1.4386304832086333e-06, "epoch": 2.6779422128259336, "percentage": 89.26, "elapsed_time": "6:07:22", "remaining_time": "0:44:10", "throughput": 31069.56, "total_tokens": 684851200} {"current_steps": 83700, "total_steps": 93654, "loss": 0.7911, "learning_rate": 1.4104255878175099e-06, "epoch": 2.6811454929848164, "percentage": 89.37, "elapsed_time": "6:15:09", "remaining_time": "0:44:36", "throughput": 30462.01, "total_tokens": 685670400} {"current_steps": 83800, "total_steps": 93654, "loss": 0.85, "learning_rate": 1.382491893302837e-06, "epoch": 2.6843487731436992, "percentage": 89.48, "elapsed_time": "6:23:08", "remaining_time": "0:45:03", "throughput": 29862.18, "total_tokens": 686489600} {"current_steps": 83900, "total_steps": 93654, "loss": 0.7469, "learning_rate": 1.3548297208082678e-06, "epoch": 2.687552053302582, "percentage": 89.59, "elapsed_time": "6:31:57", "remaining_time": "0:45:34", "throughput": 29225.52, "total_tokens": 687308800} {"current_steps": 84000, "total_steps": 93654, "loss": 0.815, "learning_rate": 1.3274393883558916e-06, "epoch": 2.6907553334614644, "percentage": 89.69, "elapsed_time": "6:40:36", "remaining_time": "0:46:02", "throughput": 28628.31, "total_tokens": 688128000} {"current_steps": 84100, "total_steps": 93654, "loss": 0.8195, "learning_rate": 1.3003212108425256e-06, "epoch": 2.6939586136203473, "percentage": 89.8, "elapsed_time": "6:48:44", "remaining_time": "0:46:26", "throughput": 28092.24, "total_tokens": 688947200} {"current_steps": 84200, "total_steps": 93654, "loss": 0.8265, "learning_rate": 1.2734755000361393e-06, "epoch": 2.6971618937792297, "percentage": 89.91, "elapsed_time": "6:56:49", "remaining_time": "0:46:48", "throughput": 27580.5, "total_tokens": 689766400} {"current_steps": 84300, "total_steps": 93654, "loss": 0.8382, "learning_rate": 1.2469025645722333e-06, "epoch": 2.7003651739381125, "percentage": 90.01, "elapsed_time": "7:04:54", "remaining_time": "0:47:08", "throughput": 27087.45, "total_tokens": 690585600} {"current_steps": 84400, "total_steps": 93654, "loss": 0.7791, "learning_rate": 1.2206027099503275e-06, "epoch": 2.7035684540969953, "percentage": 90.12, "elapsed_time": "7:13:19", "remaining_time": "0:47:30", "throughput": 26592.99, "total_tokens": 691404800} {"current_steps": 84500, "total_steps": 93654, "loss": 0.8321, "learning_rate": 1.1945762385304122e-06, "epoch": 2.706771734255878, "percentage": 90.23, "elapsed_time": "7:21:17", "remaining_time": "0:47:48", "throughput": 26143.51, "total_tokens": 692224000} {"current_steps": 84600, "total_steps": 93654, "loss": 0.8494, "learning_rate": 1.168823449529488e-06, "epoch": 2.709975014414761, "percentage": 90.33, "elapsed_time": "7:28:56", "remaining_time": "0:48:02", "throughput": 25728.72, "total_tokens": 693043200} {"current_steps": 84700, "total_steps": 93654, "loss": 0.8685, "learning_rate": 1.1433446390181402e-06, "epoch": 2.7131782945736433, "percentage": 90.44, "elapsed_time": "7:36:38", "remaining_time": "0:48:16", "throughput": 25325.16, "total_tokens": 693862400} {"current_steps": 84800, "total_steps": 93654, "loss": 0.8147, "learning_rate": 1.1181400999171144e-06, "epoch": 2.716381574732526, "percentage": 90.55, "elapsed_time": "7:44:16", "remaining_time": "0:48:28", "throughput": 24937.87, "total_tokens": 694681600} {"current_steps": 84900, "total_steps": 93654, "loss": 0.8259, "learning_rate": 1.0932101219939594e-06, "epoch": 2.7195848548914086, "percentage": 90.65, "elapsed_time": "7:52:09", "remaining_time": "0:48:41", "throughput": 24550.01, "total_tokens": 695500800} {"current_steps": 85000, "total_steps": 93654, "loss": 0.8737, "learning_rate": 1.0685549918596882e-06, "epoch": 2.7227881350502914, "percentage": 90.76, "elapsed_time": "7:59:57", "remaining_time": "0:48:51", "throughput": 24179.86, "total_tokens": 696320000} {"current_steps": 85100, "total_steps": 93654, "loss": 0.8358, "learning_rate": 1.0441749929654827e-06, "epoch": 2.725991415209174, "percentage": 90.87, "elapsed_time": "8:07:48", "remaining_time": "0:49:01", "throughput": 23819.1, "total_tokens": 697139200} {"current_steps": 85200, "total_steps": 93654, "loss": 0.8231, "learning_rate": 1.0200704055994548e-06, "epoch": 2.729194695368057, "percentage": 90.97, "elapsed_time": "8:15:33", "remaining_time": "0:49:10", "throughput": 23473.79, "total_tokens": 697958400} {"current_steps": 85300, "total_steps": 93654, "loss": 0.8211, "learning_rate": 9.962415068833968e-07, "epoch": 2.73239797552694, "percentage": 91.08, "elapsed_time": "8:23:18", "remaining_time": "0:49:17", "throughput": 23139.23, "total_tokens": 698777600} {"current_steps": 85400, "total_steps": 93654, "loss": 0.8776, "learning_rate": 9.726885707696114e-07, "epoch": 2.7356012556858222, "percentage": 91.19, "elapsed_time": "8:31:04", "remaining_time": "0:49:23", "throughput": 22814.34, "total_tokens": 699596800} {"current_steps": 85500, "total_steps": 93654, "loss": 0.8198, "learning_rate": 9.494118680377612e-07, "epoch": 2.738804535844705, "percentage": 91.29, "elapsed_time": "8:38:52", "remaining_time": "0:49:29", "throughput": 22497.59, "total_tokens": 700416000} {"current_steps": 85600, "total_steps": 93654, "loss": 0.8894, "learning_rate": 9.264116662917405e-07, "epoch": 2.7420078160035875, "percentage": 91.4, "elapsed_time": "8:46:48", "remaining_time": "0:49:34", "throughput": 22184.92, "total_tokens": 701235200} {"current_steps": 85700, "total_steps": 93654, "loss": 0.8259, "learning_rate": 9.036882299566229e-07, "epoch": 2.7452110961624703, "percentage": 91.51, "elapsed_time": "8:56:37", "remaining_time": "0:49:48", "throughput": 21804.93, "total_tokens": 702054400} {"current_steps": 85800, "total_steps": 93654, "loss": 0.7636, "learning_rate": 8.812418202756107e-07, "epoch": 2.748414376321353, "percentage": 91.61, "elapsed_time": "9:07:28", "remaining_time": "0:50:06", "throughput": 21397.49, "total_tokens": 702873600} {"current_steps": 85900, "total_steps": 93654, "loss": 0.8448, "learning_rate": 8.590726953070228e-07, "epoch": 2.751617656480236, "percentage": 91.72, "elapsed_time": "9:16:54", "remaining_time": "0:50:16", "throughput": 21059.76, "total_tokens": 703692800} {"current_steps": 86000, "total_steps": 93654, "loss": 0.8467, "learning_rate": 8.371811099213394e-07, "epoch": 2.7548209366391183, "percentage": 91.83, "elapsed_time": "9:26:12", "remaining_time": "0:50:23", "throughput": 20737.85, "total_tokens": 704512000} {"current_steps": 86100, "total_steps": 93654, "loss": 0.8133, "learning_rate": 8.155673157982601e-07, "epoch": 2.758024216798001, "percentage": 91.93, "elapsed_time": "9:33:51", "remaining_time": "0:50:20", "throughput": 20485.32, "total_tokens": 705331200} {"current_steps": 86200, "total_steps": 93654, "loss": 0.8109, "learning_rate": 7.942315614238277e-07, "epoch": 2.761227496956884, "percentage": 92.04, "elapsed_time": "9:41:28", "remaining_time": "0:50:16", "throughput": 20240.49, "total_tokens": 706150400} {"current_steps": 86300, "total_steps": 93654, "loss": 0.821, "learning_rate": 7.731740920875613e-07, "epoch": 2.7644307771157663, "percentage": 92.15, "elapsed_time": "9:49:05", "remaining_time": "0:50:11", "throughput": 20001.54, "total_tokens": 706969600} {"current_steps": 86400, "total_steps": 93654, "loss": 0.8135, "learning_rate": 7.523951498796283e-07, "epoch": 2.767634057274649, "percentage": 92.25, "elapsed_time": "9:56:43", "remaining_time": "0:50:06", "throughput": 19768.44, "total_tokens": 707788800} {"current_steps": 86500, "total_steps": 93654, "loss": 0.7905, "learning_rate": 7.318949736880798e-07, "epoch": 2.770837337433532, "percentage": 92.36, "elapsed_time": "10:04:18", "remaining_time": "0:49:58", "throughput": 19543.28, "total_tokens": 708608000} {"current_steps": 86600, "total_steps": 93654, "loss": 0.8608, "learning_rate": 7.116737991960831e-07, "epoch": 2.774040617592415, "percentage": 92.47, "elapsed_time": "10:11:54", "remaining_time": "0:49:50", "throughput": 19322.72, "total_tokens": 709427200} {"current_steps": 86700, "total_steps": 93654, "loss": 0.8586, "learning_rate": 6.917318588792299e-07, "epoch": 2.777243897751297, "percentage": 92.57, "elapsed_time": "10:19:33", "remaining_time": "0:49:41", "throughput": 19106.11, "total_tokens": 710246400} {"current_steps": 86800, "total_steps": 93654, "loss": 0.8473, "learning_rate": 6.720693820028629e-07, "epoch": 2.78044717791018, "percentage": 92.68, "elapsed_time": "10:27:09", "remaining_time": "0:49:31", "throughput": 18896.35, "total_tokens": 711065600} {"current_steps": 86900, "total_steps": 93654, "loss": 0.8182, "learning_rate": 6.526865946194172e-07, "epoch": 2.783650458069063, "percentage": 92.79, "elapsed_time": "10:34:45", "remaining_time": "0:49:20", "throughput": 18691.88, "total_tokens": 711884800} {"current_steps": 87000, "total_steps": 93654, "loss": 0.8493, "learning_rate": 6.335837195658528e-07, "epoch": 2.7868537382279452, "percentage": 92.9, "elapsed_time": "10:42:56", "remaining_time": "0:49:10", "throughput": 18474.86, "total_tokens": 712704000} {"current_steps": 87100, "total_steps": 93654, "loss": 0.8134, "learning_rate": 6.147609764610707e-07, "epoch": 2.790057018386828, "percentage": 93.0, "elapsed_time": "10:51:15", "remaining_time": "0:49:00", "throughput": 18260.13, "total_tokens": 713523200} {"current_steps": 87200, "total_steps": 93654, "loss": 0.7893, "learning_rate": 5.962185817034005e-07, "epoch": 2.793260298545711, "percentage": 93.11, "elapsed_time": "11:00:55", "remaining_time": "0:48:55", "throughput": 18013.85, "total_tokens": 714342400} {"current_steps": 87300, "total_steps": 93654, "loss": 0.7896, "learning_rate": 5.779567484681032e-07, "epoch": 2.7964635787045937, "percentage": 93.22, "elapsed_time": "11:12:41", "remaining_time": "0:48:57", "throughput": 17718.96, "total_tokens": 715161600} {"current_steps": 87400, "total_steps": 93654, "loss": 0.8185, "learning_rate": 5.599756867049221e-07, "epoch": 2.799666858863476, "percentage": 93.32, "elapsed_time": "11:24:15", "remaining_time": "0:48:57", "throughput": 17439.31, "total_tokens": 715980800} {"current_steps": 87500, "total_steps": 93654, "loss": 0.8188, "learning_rate": 5.422756031356779e-07, "epoch": 2.802870139022359, "percentage": 93.43, "elapsed_time": "11:35:58", "remaining_time": "0:48:56", "throughput": 17165.47, "total_tokens": 716800000} {"current_steps": 87600, "total_steps": 93654, "loss": 0.8303, "learning_rate": 5.248567012518857e-07, "epoch": 2.8060734191812418, "percentage": 93.54, "elapsed_time": "11:45:55", "remaining_time": "0:48:47", "throughput": 16942.57, "total_tokens": 717619200} {"current_steps": 87700, "total_steps": 93654, "loss": 0.7866, "learning_rate": 5.077191813124105e-07, "epoch": 2.809276699340124, "percentage": 93.64, "elapsed_time": "11:56:40", "remaining_time": "0:48:39", "throughput": 16707.85, "total_tokens": 718438400} {"current_steps": 87800, "total_steps": 93654, "loss": 0.8269, "learning_rate": 4.90863240341169e-07, "epoch": 2.812479979499007, "percentage": 93.75, "elapsed_time": "12:04:17", "remaining_time": "0:48:17", "throughput": 16550.74, "total_tokens": 719257600} {"current_steps": 87900, "total_steps": 93654, "loss": 0.7737, "learning_rate": 4.742890721248755e-07, "epoch": 2.81568325965789, "percentage": 93.86, "elapsed_time": "12:11:53", "remaining_time": "0:47:54", "throughput": 16397.47, "total_tokens": 720076800} {"current_steps": 88000, "total_steps": 93654, "loss": 0.8196, "learning_rate": 4.579968672107943e-07, "epoch": 2.8188865398167726, "percentage": 93.96, "elapsed_time": "12:19:30", "remaining_time": "0:47:30", "throughput": 16247.23, "total_tokens": 720896000} {"current_steps": 88100, "total_steps": 93654, "loss": 0.7998, "learning_rate": 4.419868129045629e-07, "epoch": 2.822089819975655, "percentage": 94.07, "elapsed_time": "12:27:08", "remaining_time": "0:47:06", "throughput": 16099.56, "total_tokens": 721715200} {"current_steps": 88200, "total_steps": 93654, "loss": 0.8535, "learning_rate": 4.2625909326803325e-07, "epoch": 2.825293100134538, "percentage": 94.18, "elapsed_time": "12:34:46", "remaining_time": "0:46:40", "throughput": 15954.83, "total_tokens": 722534400} {"current_steps": 88100, "total_steps": 93654, "loss": 0.7998, "learning_rate": 4.419868129045629e-07, "epoch": 2.822089819975655, "percentage": 94.07, "elapsed_time": "0:08:08", "remaining_time": "0:00:30", "throughput": 1477950.48, "total_tokens": 721715200} {"current_steps": 88200, "total_steps": 93654, "loss": 0.8534, "learning_rate": 4.2625909326803325e-07, "epoch": 2.825293100134538, "percentage": 94.18, "elapsed_time": "0:16:06", "remaining_time": "0:00:59", "throughput": 747875.39, "total_tokens": 722534400} {"current_steps": 88300, "total_steps": 93654, "loss": 0.8262, "learning_rate": 4.1081388911715645e-07, "epoch": 2.82849638029342, "percentage": 94.28, "elapsed_time": "0:24:05", "remaining_time": "0:01:27", "throughput": 500269.26, "total_tokens": 723353600} {"current_steps": 88400, "total_steps": 93654, "loss": 0.8323, "learning_rate": 3.9565137801990395e-07, "epoch": 2.831699660452303, "percentage": 94.39, "elapsed_time": "0:32:05", "remaining_time": "0:01:54", "throughput": 376144.14, "total_tokens": 724172800} {"current_steps": 88500, "total_steps": 93654, "loss": 0.8116, "learning_rate": 3.807717342942302e-07, "epoch": 2.834902940611186, "percentage": 94.5, "elapsed_time": "0:40:03", "remaining_time": "0:02:19", "throughput": 301671.05, "total_tokens": 724992000} {"current_steps": 88600, "total_steps": 93654, "loss": 0.8481, "learning_rate": 3.661751290060633e-07, "epoch": 2.8381062207700687, "percentage": 94.6, "elapsed_time": "0:48:02", "remaining_time": "0:02:44", "throughput": 251793.85, "total_tokens": 725811200} {"current_steps": 88700, "total_steps": 93654, "loss": 0.8084, "learning_rate": 3.5186172996733714e-07, "epoch": 2.8413095009289515, "percentage": 94.71, "elapsed_time": "0:55:57", "remaining_time": "0:03:07", "throughput": 216409.68, "total_tokens": 726630400} {"current_steps": 88800, "total_steps": 93654, "loss": 0.7923, "learning_rate": 3.3783170173406764e-07, "epoch": 2.844512781087834, "percentage": 94.82, "elapsed_time": "1:03:53", "remaining_time": "0:03:29", "throughput": 189737.84, "total_tokens": 727449600} {"current_steps": 88900, "total_steps": 93654, "loss": 0.8397, "learning_rate": 3.2408520560445463e-07, "epoch": 2.8477160612467167, "percentage": 94.92, "elapsed_time": "1:11:52", "remaining_time": "0:03:50", "throughput": 168870.1, "total_tokens": 728268800} {"current_steps": 89000, "total_steps": 93654, "loss": 0.7856, "learning_rate": 3.10622399617036e-07, "epoch": 2.850919341405599, "percentage": 95.03, "elapsed_time": "1:20:01", "remaining_time": "0:04:11", "throughput": 151830.97, "total_tokens": 729088000} {"current_steps": 89100, "total_steps": 93654, "loss": 0.8271, "learning_rate": 2.9744343854886393e-07, "epoch": 2.854122621564482, "percentage": 95.14, "elapsed_time": "1:29:34", "remaining_time": "0:04:34", "throughput": 135800.15, "total_tokens": 729907200} {"current_steps": 89200, "total_steps": 93654, "loss": 0.8334, "learning_rate": 2.8454847391372886e-07, "epoch": 2.8573259017233648, "percentage": 95.24, "elapsed_time": "1:37:45", "remaining_time": "0:04:52", "throughput": 124576.59, "total_tokens": 730726400} {"current_steps": 89300, "total_steps": 93654, "loss": 0.8198, "learning_rate": 2.719376539604107e-07, "epoch": 2.8605291818822476, "percentage": 95.35, "elapsed_time": "1:45:46", "remaining_time": "0:05:09", "throughput": 115270.01, "total_tokens": 731545600} {"current_steps": 89400, "total_steps": 93654, "loss": 0.8199, "learning_rate": 2.5961112367098306e-07, "epoch": 2.86373246204113, "percentage": 95.46, "elapsed_time": "1:53:44", "remaining_time": "0:05:24", "throughput": 107311.34, "total_tokens": 732364800} {"current_steps": 89500, "total_steps": 93654, "loss": 0.7963, "learning_rate": 2.4756902475914777e-07, "epoch": 2.866935742200013, "percentage": 95.56, "elapsed_time": "2:02:55", "remaining_time": "0:05:42", "throughput": 99409.89, "total_tokens": 733184000} {"current_steps": 89600, "total_steps": 93654, "loss": 0.8353, "learning_rate": 2.358114956685975e-07, "epoch": 2.8701390223588956, "percentage": 95.67, "elapsed_time": "2:12:05", "remaining_time": "0:05:58", "throughput": 92615.74, "total_tokens": 734003200} {"current_steps": 89700, "total_steps": 93654, "loss": 0.8547, "learning_rate": 2.243386715714224e-07, "epoch": 2.873342302517778, "percentage": 95.78, "elapsed_time": "2:21:01", "remaining_time": "0:06:12", "throughput": 86847.49, "total_tokens": 734822400} {"current_steps": 89800, "total_steps": 93654, "loss": 0.8233, "learning_rate": 2.1315068436656983e-07, "epoch": 2.876545582676661, "percentage": 95.88, "elapsed_time": "2:29:29", "remaining_time": "0:06:24", "throughput": 82017.57, "total_tokens": 735641600} {"current_steps": 89900, "total_steps": 93654, "loss": 0.8622, "learning_rate": 2.0224766267831207e-07, "epoch": 2.8797488628355437, "percentage": 95.99, "elapsed_time": "2:37:24", "remaining_time": "0:06:34", "throughput": 77976.7, "total_tokens": 736460800} {"current_steps": 90000, "total_steps": 93654, "loss": 0.789, "learning_rate": 1.9162973185478383e-07, "epoch": 2.8829521429944265, "percentage": 96.1, "elapsed_time": "2:46:03", "remaining_time": "0:06:44", "throughput": 73999.62, "total_tokens": 737280000} {"current_steps": 90100, "total_steps": 93654, "loss": 0.8723, "learning_rate": 1.8129701396652487e-07, "epoch": 2.886155423153309, "percentage": 96.21, "elapsed_time": "2:55:07", "remaining_time": "0:06:54", "throughput": 70244.32, "total_tokens": 738099200} {"current_steps": 90200, "total_steps": 93654, "loss": 0.8136, "learning_rate": 1.7124962780508957e-07, "epoch": 2.8893587033121917, "percentage": 96.31, "elapsed_time": "3:03:17", "remaining_time": "0:07:01", "throughput": 67187.52, "total_tokens": 738918400} {"current_steps": 90300, "total_steps": 93654, "loss": 0.8263, "learning_rate": 1.6148768888166744e-07, "epoch": 2.8925619834710745, "percentage": 96.42, "elapsed_time": "3:12:22", "remaining_time": "0:07:08", "throughput": 64089.22, "total_tokens": 739737600} {"current_steps": 90400, "total_steps": 93654, "loss": 0.8388, "learning_rate": 1.5201130942577578e-07, "epoch": 2.895765263629957, "percentage": 96.53, "elapsed_time": "3:21:44", "remaining_time": "0:07:15", "throughput": 61179.47, "total_tokens": 740556800} {"current_steps": 90500, "total_steps": 93654, "loss": 0.8284, "learning_rate": 1.4282059838394701e-07, "epoch": 2.8989685437888397, "percentage": 96.63, "elapsed_time": "3:32:29", "remaining_time": "0:07:24", "throughput": 58149.41, "total_tokens": 741376000} {"current_steps": 90600, "total_steps": 93654, "loss": 0.834, "learning_rate": 1.3391566141848778e-07, "epoch": 2.9021718239477226, "percentage": 96.74, "elapsed_time": "3:42:45", "remaining_time": "0:07:30", "throughput": 55530.76, "total_tokens": 742195200} {"current_steps": 90700, "total_steps": 93654, "loss": 0.8798, "learning_rate": 1.2529660090626894e-07, "epoch": 2.9053751041066054, "percentage": 96.85, "elapsed_time": "3:52:37", "remaining_time": "0:07:34", "throughput": 53233.95, "total_tokens": 743014400} {"current_steps": 90800, "total_steps": 93654, "loss": 0.8443, "learning_rate": 1.1696351593753485e-07, "epoch": 2.9085783842654878, "percentage": 96.95, "elapsed_time": "4:02:25", "remaining_time": "0:07:37", "throughput": 51137.26, "total_tokens": 743833600} {"current_steps": 90900, "total_steps": 93654, "loss": 0.7991, "learning_rate": 1.0891650231477646e-07, "epoch": 2.9117816644243706, "percentage": 97.06, "elapsed_time": "4:12:05", "remaining_time": "0:07:38", "throughput": 49231.53, "total_tokens": 744652800} {"current_steps": 91000, "total_steps": 93654, "loss": 0.8134, "learning_rate": 1.0115565255162107e-07, "epoch": 2.9149849445832534, "percentage": 97.17, "elapsed_time": "4:21:11", "remaining_time": "0:07:37", "throughput": 47568.44, "total_tokens": 745472000} {"current_steps": 91100, "total_steps": 93654, "loss": 0.855, "learning_rate": 9.368105587177767e-08, "epoch": 2.918188224742136, "percentage": 97.27, "elapsed_time": "4:31:00", "remaining_time": "0:07:35", "throughput": 45894.65, "total_tokens": 746291200} {"current_steps": 91200, "total_steps": 93654, "loss": 0.7894, "learning_rate": 8.649279820800161e-08, "epoch": 2.9213915049010186, "percentage": 97.38, "elapsed_time": "4:39:08", "remaining_time": "0:07:30", "throughput": 44608.73, "total_tokens": 747110400} {"current_steps": 91300, "total_steps": 93654, "loss": 0.8311, "learning_rate": 7.959096220111206e-08, "epoch": 2.9245947850599014, "percentage": 97.49, "elapsed_time": "4:46:50", "remaining_time": "0:07:23", "throughput": 43457.38, "total_tokens": 747929600} {"current_steps": 91400, "total_steps": 93654, "loss": 0.7856, "learning_rate": 7.297562719904561e-08, "epoch": 2.9277980652187843, "percentage": 97.59, "elapsed_time": "4:54:31", "remaining_time": "0:07:15", "throughput": 42370.19, "total_tokens": 748748800} {"current_steps": 91500, "total_steps": 93654, "loss": 0.8379, "learning_rate": 6.664686925593188e-08, "epoch": 2.9310013453776667, "percentage": 97.7, "elapsed_time": "5:02:36", "remaining_time": "0:07:07", "throughput": 41283.7, "total_tokens": 749568000} {"current_steps": 91600, "total_steps": 93654, "loss": 0.7529, "learning_rate": 6.060476113123603e-08, "epoch": 2.9342046255365495, "percentage": 97.81, "elapsed_time": "5:10:55", "remaining_time": "0:06:58", "throughput": 40224.13, "total_tokens": 750387200} {"current_steps": 91700, "total_steps": 93654, "loss": 0.8836, "learning_rate": 5.4849372288903744e-08, "epoch": 2.937407905695432, "percentage": 97.91, "elapsed_time": "5:19:14", "remaining_time": "0:06:48", "throughput": 39217.83, "total_tokens": 751206400} {"current_steps": 91800, "total_steps": 93654, "loss": 0.8253, "learning_rate": 4.9380768896578614e-08, "epoch": 2.9406111858543147, "percentage": 98.02, "elapsed_time": "5:27:19", "remaining_time": "0:06:36", "throughput": 38290.97, "total_tokens": 752025600} {"current_steps": 91900, "total_steps": 93654, "loss": 0.7867, "learning_rate": 4.419901382483327e-08, "epoch": 2.9438144660131975, "percentage": 98.13, "elapsed_time": "5:35:50", "remaining_time": "0:06:24", "throughput": 37360.97, "total_tokens": 752844800} {"current_steps": 92000, "total_steps": 93654, "loss": 0.8089, "learning_rate": 3.930416664644498e-08, "epoch": 2.9470177461720803, "percentage": 98.23, "elapsed_time": "5:44:18", "remaining_time": "0:06:11", "throughput": 36481.17, "total_tokens": 753664000} {"current_steps": 92100, "total_steps": 93654, "loss": 0.8324, "learning_rate": 3.469628363571564e-08, "epoch": 2.950221026330963, "percentage": 98.34, "elapsed_time": "5:52:49", "remaining_time": "0:05:57", "throughput": 35640.66, "total_tokens": 754483200} {"current_steps": 92200, "total_steps": 93654, "loss": 0.8199, "learning_rate": 3.037541776782782e-08, "epoch": 2.9534243064898456, "percentage": 98.45, "elapsed_time": "6:00:23", "remaining_time": "0:05:40", "throughput": 34930.23, "total_tokens": 755302400} {"current_steps": 92300, "total_steps": 93654, "loss": 0.8282, "learning_rate": 2.6341618718223048e-08, "epoch": 2.9566275866487284, "percentage": 98.55, "elapsed_time": "6:07:55", "remaining_time": "0:05:23", "throughput": 34250.99, "total_tokens": 756121600} {"current_steps": 92400, "total_steps": 93654, "loss": 0.823, "learning_rate": 2.2594932862041173e-08, "epoch": 2.9598308668076108, "percentage": 98.66, "elapsed_time": "6:15:32", "remaining_time": "0:05:05", "throughput": 33593.74, "total_tokens": 756940800} {"current_steps": 92500, "total_steps": 93654, "loss": 0.7854, "learning_rate": 1.91354032735902e-08, "epoch": 2.9630341469664936, "percentage": 98.77, "elapsed_time": "6:23:06", "remaining_time": "0:04:46", "throughput": 32966.07, "total_tokens": 757760000} {"current_steps": 92600, "total_steps": 93654, "loss": 0.8654, "learning_rate": 1.5963069725838385e-08, "epoch": 2.9662374271253764, "percentage": 98.87, "elapsed_time": "6:30:52", "remaining_time": "0:04:26", "throughput": 32345.7, "total_tokens": 758579200} {"current_steps": 92700, "total_steps": 93654, "loss": 0.7966, "learning_rate": 1.3077968689964582e-08, "epoch": 2.9694407072842592, "percentage": 98.98, "elapsed_time": "6:38:45", "remaining_time": "0:04:06", "throughput": 31739.88, "total_tokens": 759398400} {"current_steps": 92800, "total_steps": 93654, "loss": 0.8375, "learning_rate": 1.0480133334947462e-08, "epoch": 2.9726439874431416, "percentage": 99.09, "elapsed_time": "6:46:54", "remaining_time": "0:03:44", "throughput": 31138.04, "total_tokens": 760217600} {"current_steps": 92900, "total_steps": 93654, "loss": 0.8056, "learning_rate": 8.169593527160291e-09, "epoch": 2.9758472676020244, "percentage": 99.19, "elapsed_time": "6:54:48", "remaining_time": "0:03:22", "throughput": 30577.42, "total_tokens": 761036800} {"current_steps": 93000, "total_steps": 93654, "loss": 0.8026, "learning_rate": 6.146375830054507e-09, "epoch": 2.9790505477609073, "percentage": 99.3, "elapsed_time": "7:03:20", "remaining_time": "0:02:58", "throughput": 29993.59, "total_tokens": 761856000} {"current_steps": 93100, "total_steps": 93654, "loss": 0.8472, "learning_rate": 4.410503503840535e-09, "epoch": 2.9822538279197897, "percentage": 99.41, "elapsed_time": "7:12:47", "remaining_time": "0:02:34", "throughput": 29370.17, "total_tokens": 762675200} {"current_steps": 93200, "total_steps": 93654, "loss": 0.8558, "learning_rate": 2.961996505213005e-09, "epoch": 2.9854571080786725, "percentage": 99.52, "elapsed_time": "7:21:56", "remaining_time": "0:02:09", "throughput": 28793.39, "total_tokens": 763494400} {"current_steps": 93300, "total_steps": 93654, "loss": 0.8321, "learning_rate": 1.8008714871453613e-09, "epoch": 2.9886603882375553, "percentage": 99.62, "elapsed_time": "7:29:59", "remaining_time": "0:01:42", "throughput": 28308.71, "total_tokens": 764313600} {"current_steps": 93400, "total_steps": 93654, "loss": 0.8264, "learning_rate": 9.271417986705943e-10, "epoch": 2.991863668396438, "percentage": 99.73, "elapsed_time": "7:37:53", "remaining_time": "0:01:14", "throughput": 27849.62, "total_tokens": 765132800} {"current_steps": 93500, "total_steps": 93654, "loss": 0.7796, "learning_rate": 3.408174847480128e-10, "epoch": 2.9950669485553205, "percentage": 99.84, "elapsed_time": "7:45:53", "remaining_time": "0:00:46", "throughput": 27401.36, "total_tokens": 765952000} {"current_steps": 93600, "total_steps": 93654, "loss": 0.7863, "learning_rate": 4.1905286135568434e-11, "epoch": 2.9982702287142033, "percentage": 99.94, "elapsed_time": "7:55:10", "remaining_time": "0:00:16", "throughput": 26894.63, "total_tokens": 766771200} {"current_steps": 93654, "total_steps": 93654, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "7:59:21", "remaining_time": "0:00:00", "throughput": 26674.59, "total_tokens": 767213568}