{"current_steps": 1, "total_steps": 1184, "loss": 4.6817, "learning_rate": 0.0, "epoch": 0.0033783783783783786, "percentage": 0.08, "elapsed_time": "0:00:12", "remaining_time": "4:16:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2, "total_steps": 1184, "loss": 4.5642, "learning_rate": 5.017166594399687e-06, "epoch": 0.006756756756756757, "percentage": 0.17, "elapsed_time": "0:00:18", "remaining_time": "2:58:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3, "total_steps": 1184, "loss": 4.787, "learning_rate": 7.952020911994375e-06, "epoch": 0.010135135135135136, "percentage": 0.25, "elapsed_time": "0:00:23", "remaining_time": "2:32:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4, "total_steps": 1184, "loss": 3.1422, "learning_rate": 1.0034333188799373e-05, "epoch": 0.013513513513513514, "percentage": 0.34, "elapsed_time": "0:00:28", "remaining_time": "2:19:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5, "total_steps": 1184, "loss": 1.9827, "learning_rate": 1.164950007226698e-05, "epoch": 0.016891891891891893, "percentage": 0.42, "elapsed_time": "0:00:33", "remaining_time": "2:11:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6, "total_steps": 1184, "loss": 1.0212, "learning_rate": 1.2969187506394062e-05, "epoch": 0.02027027027027027, "percentage": 0.51, "elapsed_time": "0:00:38", "remaining_time": "2:06:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7, "total_steps": 1184, "loss": 1.1823, "learning_rate": 1.4084967333570947e-05, "epoch": 0.02364864864864865, "percentage": 0.59, "elapsed_time": "0:00:43", "remaining_time": "2:02:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8, "total_steps": 1184, "loss": 0.7368, "learning_rate": 1.505149978319906e-05, "epoch": 0.02702702702702703, "percentage": 0.68, "elapsed_time": "0:00:48", "remaining_time": "1:59:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9, "total_steps": 1184, "loss": 0.6276, "learning_rate": 1.590404182398875e-05, "epoch": 0.030405405405405407, "percentage": 0.76, "elapsed_time": "0:00:53", "remaining_time": "1:57:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10, "total_steps": 1184, "loss": 0.5934, "learning_rate": 1.666666666666667e-05, "epoch": 0.033783783783783786, "percentage": 0.84, "elapsed_time": "0:00:59", "remaining_time": "1:55:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11, "total_steps": 1184, "loss": 0.6987, "learning_rate": 1.7356544752637084e-05, "epoch": 0.037162162162162164, "percentage": 0.93, "elapsed_time": "0:01:04", "remaining_time": "1:54:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12, "total_steps": 1184, "loss": 0.5722, "learning_rate": 1.7986354100793748e-05, "epoch": 0.04054054054054054, "percentage": 1.01, "elapsed_time": "0:01:09", "remaining_time": "1:52:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13, "total_steps": 1184, "loss": 0.5199, "learning_rate": 1.8565722538447282e-05, "epoch": 0.04391891891891892, "percentage": 1.1, "elapsed_time": "0:01:14", "remaining_time": "1:51:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14, "total_steps": 1184, "loss": 0.5063, "learning_rate": 1.9102133927970633e-05, "epoch": 0.0472972972972973, "percentage": 1.18, "elapsed_time": "0:01:19", "remaining_time": "1:50:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15, "total_steps": 1184, "loss": 0.5368, "learning_rate": 1.9601520984261358e-05, "epoch": 0.05067567567567568, "percentage": 1.27, "elapsed_time": "0:01:24", "remaining_time": "1:49:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16, "total_steps": 1184, "loss": 0.4682, "learning_rate": 2.0068666377598747e-05, "epoch": 0.05405405405405406, "percentage": 1.35, "elapsed_time": "0:01:29", "remaining_time": "1:49:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17, "total_steps": 1184, "loss": 0.4997, "learning_rate": 2.0507482022971233e-05, "epoch": 0.057432432432432436, "percentage": 1.44, "elapsed_time": "0:01:34", "remaining_time": "1:48:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18, "total_steps": 1184, "loss": 0.4659, "learning_rate": 2.0921208418388435e-05, "epoch": 0.060810810810810814, "percentage": 1.52, "elapsed_time": "0:01:40", "remaining_time": "1:48:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19, "total_steps": 1184, "loss": 0.4697, "learning_rate": 2.1312560015880482e-05, "epoch": 0.06418918918918919, "percentage": 1.6, "elapsed_time": "0:01:45", "remaining_time": "1:47:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20, "total_steps": 1184, "loss": 0.4851, "learning_rate": 2.1683833261066357e-05, "epoch": 0.06756756756756757, "percentage": 1.69, "elapsed_time": "0:01:50", "remaining_time": "1:47:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21, "total_steps": 1184, "loss": 0.4517, "learning_rate": 2.2036988245565324e-05, "epoch": 0.07094594594594594, "percentage": 1.77, "elapsed_time": "0:01:55", "remaining_time": "1:46:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22, "total_steps": 1184, "loss": 0.4982, "learning_rate": 2.2373711347036773e-05, "epoch": 0.07432432432432433, "percentage": 1.86, "elapsed_time": "0:02:00", "remaining_time": "1:46:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23, "total_steps": 1184, "loss": 0.4128, "learning_rate": 2.269546393362655e-05, "epoch": 0.0777027027027027, "percentage": 1.94, "elapsed_time": "0:02:05", "remaining_time": "1:45:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24, "total_steps": 1184, "loss": 0.4281, "learning_rate": 2.3003520695193437e-05, "epoch": 0.08108108108108109, "percentage": 2.03, "elapsed_time": "0:02:11", "remaining_time": "1:45:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25, "total_steps": 1184, "loss": 0.4407, "learning_rate": 2.329900014453396e-05, "epoch": 0.08445945945945946, "percentage": 2.11, "elapsed_time": "0:02:16", "remaining_time": "1:45:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26, "total_steps": 1184, "loss": 0.4155, "learning_rate": 2.3582889132846968e-05, "epoch": 0.08783783783783784, "percentage": 2.2, "elapsed_time": "0:02:21", "remaining_time": "1:44:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27, "total_steps": 1184, "loss": 0.4191, "learning_rate": 2.3856062735983123e-05, "epoch": 0.09121621621621621, "percentage": 2.28, "elapsed_time": "0:02:26", "remaining_time": "1:44:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28, "total_steps": 1184, "loss": 0.4055, "learning_rate": 2.4119300522370322e-05, "epoch": 0.0945945945945946, "percentage": 2.36, "elapsed_time": "0:02:31", "remaining_time": "1:44:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29, "total_steps": 1184, "loss": 0.4443, "learning_rate": 2.4373299964982603e-05, "epoch": 0.09797297297297297, "percentage": 2.45, "elapsed_time": "0:02:36", "remaining_time": "1:44:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30, "total_steps": 1184, "loss": 0.4093, "learning_rate": 2.4618687578661044e-05, "epoch": 0.10135135135135136, "percentage": 2.53, "elapsed_time": "0:02:41", "remaining_time": "1:43:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 31, "total_steps": 1184, "loss": 0.4288, "learning_rate": 2.4856028230571212e-05, "epoch": 0.10472972972972973, "percentage": 2.62, "elapsed_time": "0:02:46", "remaining_time": "1:43:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 32, "total_steps": 1184, "loss": 0.4222, "learning_rate": 2.5085832971998436e-05, "epoch": 0.10810810810810811, "percentage": 2.7, "elapsed_time": "0:02:52", "remaining_time": "1:43:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 33, "total_steps": 1184, "loss": 0.416, "learning_rate": 2.530856566463146e-05, "epoch": 0.11148648648648649, "percentage": 2.79, "elapsed_time": "0:02:57", "remaining_time": "1:43:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 34, "total_steps": 1184, "loss": 0.3735, "learning_rate": 2.552464861737092e-05, "epoch": 0.11486486486486487, "percentage": 2.87, "elapsed_time": "0:03:02", "remaining_time": "1:42:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 35, "total_steps": 1184, "loss": 0.3315, "learning_rate": 2.5734467405837933e-05, "epoch": 0.11824324324324324, "percentage": 2.96, "elapsed_time": "0:03:07", "remaining_time": "1:42:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 36, "total_steps": 1184, "loss": 0.3652, "learning_rate": 2.5938375012788124e-05, "epoch": 0.12162162162162163, "percentage": 3.04, "elapsed_time": "0:03:12", "remaining_time": "1:42:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 37, "total_steps": 1184, "loss": 0.452, "learning_rate": 2.6136695401116585e-05, "epoch": 0.125, "percentage": 3.12, "elapsed_time": "0:03:17", "remaining_time": "1:42:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 38, "total_steps": 1184, "loss": 0.3328, "learning_rate": 2.6329726610280168e-05, "epoch": 0.12837837837837837, "percentage": 3.21, "elapsed_time": "0:03:22", "remaining_time": "1:41:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 39, "total_steps": 1184, "loss": 0.3987, "learning_rate": 2.651774345044166e-05, "epoch": 0.13175675675675674, "percentage": 3.29, "elapsed_time": "0:03:27", "remaining_time": "1:41:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 40, "total_steps": 1184, "loss": 0.3794, "learning_rate": 2.6700999855466042e-05, "epoch": 0.13513513513513514, "percentage": 3.38, "elapsed_time": "0:03:33", "remaining_time": "1:41:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 41, "total_steps": 1184, "loss": 0.4218, "learning_rate": 2.687973094532893e-05, "epoch": 0.13851351351351351, "percentage": 3.46, "elapsed_time": "0:03:38", "remaining_time": "1:41:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 42, "total_steps": 1184, "loss": 0.3788, "learning_rate": 2.7054154839965013e-05, "epoch": 0.14189189189189189, "percentage": 3.55, "elapsed_time": "0:03:43", "remaining_time": "1:41:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 43, "total_steps": 1184, "loss": 0.3946, "learning_rate": 2.722447425965978e-05, "epoch": 0.14527027027027026, "percentage": 3.63, "elapsed_time": "0:03:48", "remaining_time": "1:41:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 44, "total_steps": 1184, "loss": 0.389, "learning_rate": 2.739087794143646e-05, "epoch": 0.14864864864864866, "percentage": 3.72, "elapsed_time": "0:03:53", "remaining_time": "1:40:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 45, "total_steps": 1184, "loss": 0.399, "learning_rate": 2.755354189625573e-05, "epoch": 0.15202702702702703, "percentage": 3.8, "elapsed_time": "0:03:58", "remaining_time": "1:40:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 46, "total_steps": 1184, "loss": 0.3924, "learning_rate": 2.771263052802624e-05, "epoch": 0.1554054054054054, "percentage": 3.89, "elapsed_time": "0:04:03", "remaining_time": "1:40:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 47, "total_steps": 1184, "loss": 0.4111, "learning_rate": 2.7868297632261957e-05, "epoch": 0.15878378378378377, "percentage": 3.97, "elapsed_time": "0:04:08", "remaining_time": "1:40:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 48, "total_steps": 1184, "loss": 0.3958, "learning_rate": 2.8020687289593123e-05, "epoch": 0.16216216216216217, "percentage": 4.05, "elapsed_time": "0:04:14", "remaining_time": "1:40:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 49, "total_steps": 1184, "loss": 0.3844, "learning_rate": 2.8169934667141895e-05, "epoch": 0.16554054054054054, "percentage": 4.14, "elapsed_time": "0:04:19", "remaining_time": "1:40:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 1184, "loss": 0.3847, "learning_rate": 2.8316166738933646e-05, "epoch": 0.16891891891891891, "percentage": 4.22, "elapsed_time": "0:04:24", "remaining_time": "1:39:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 51, "total_steps": 1184, "loss": 0.4043, "learning_rate": 2.845950293496561e-05, "epoch": 0.17229729729729729, "percentage": 4.31, "elapsed_time": "0:04:29", "remaining_time": "1:39:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 52, "total_steps": 1184, "loss": 0.3806, "learning_rate": 2.8600055727246657e-05, "epoch": 0.17567567567567569, "percentage": 4.39, "elapsed_time": "0:04:34", "remaining_time": "1:39:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 53, "total_steps": 1184, "loss": 0.416, "learning_rate": 2.8737931160013153e-05, "epoch": 0.17905405405405406, "percentage": 4.48, "elapsed_time": "0:04:39", "remaining_time": "1:39:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 54, "total_steps": 1184, "loss": 0.3548, "learning_rate": 2.8873229330382812e-05, "epoch": 0.18243243243243243, "percentage": 4.56, "elapsed_time": "0:04:44", "remaining_time": "1:39:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 55, "total_steps": 1184, "loss": 0.3982, "learning_rate": 2.9006044824904066e-05, "epoch": 0.1858108108108108, "percentage": 4.65, "elapsed_time": "0:04:49", "remaining_time": "1:39:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 56, "total_steps": 1184, "loss": 0.3536, "learning_rate": 2.913646711677001e-05, "epoch": 0.1891891891891892, "percentage": 4.73, "elapsed_time": "0:04:55", "remaining_time": "1:39:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 57, "total_steps": 1184, "loss": 0.3594, "learning_rate": 2.926458092787486e-05, "epoch": 0.19256756756756757, "percentage": 4.81, "elapsed_time": "0:05:00", "remaining_time": "1:38:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 58, "total_steps": 1184, "loss": 0.3725, "learning_rate": 2.939046655938229e-05, "epoch": 0.19594594594594594, "percentage": 4.9, "elapsed_time": "0:05:05", "remaining_time": "1:38:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 59, "total_steps": 1184, "loss": 0.3896, "learning_rate": 2.951420019403574e-05, "epoch": 0.19932432432432431, "percentage": 4.98, "elapsed_time": "0:05:10", "remaining_time": "1:38:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 60, "total_steps": 1184, "loss": 0.3633, "learning_rate": 2.963585417306073e-05, "epoch": 0.20270270270270271, "percentage": 5.07, "elapsed_time": "0:05:15", "remaining_time": "1:38:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 61, "total_steps": 1184, "loss": 0.3447, "learning_rate": 2.9755497250179453e-05, "epoch": 0.20608108108108109, "percentage": 5.15, "elapsed_time": "0:05:20", "remaining_time": "1:38:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 62, "total_steps": 1184, "loss": 0.3851, "learning_rate": 2.98731948249709e-05, "epoch": 0.20945945945945946, "percentage": 5.24, "elapsed_time": "0:05:25", "remaining_time": "1:38:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 63, "total_steps": 1184, "loss": 0.3896, "learning_rate": 2.9989009157559694e-05, "epoch": 0.21283783783783783, "percentage": 5.32, "elapsed_time": "0:05:30", "remaining_time": "1:38:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 64, "total_steps": 1184, "loss": 0.4528, "learning_rate": 3.010299956639812e-05, "epoch": 0.21621621621621623, "percentage": 5.41, "elapsed_time": "0:05:36", "remaining_time": "1:38:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 65, "total_steps": 1184, "loss": 0.3151, "learning_rate": 3.021522261071426e-05, "epoch": 0.2195945945945946, "percentage": 5.49, "elapsed_time": "0:05:41", "remaining_time": "1:37:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 66, "total_steps": 1184, "loss": 0.3501, "learning_rate": 3.0325732259031143e-05, "epoch": 0.22297297297297297, "percentage": 5.57, "elapsed_time": "0:05:46", "remaining_time": "1:37:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 67, "total_steps": 1184, "loss": 0.3383, "learning_rate": 3.043458004501377e-05, "epoch": 0.22635135135135134, "percentage": 5.66, "elapsed_time": "0:05:51", "remaining_time": "1:37:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 68, "total_steps": 1184, "loss": 0.3559, "learning_rate": 3.054181521177061e-05, "epoch": 0.22972972972972974, "percentage": 5.74, "elapsed_time": "0:05:56", "remaining_time": "1:37:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 69, "total_steps": 1184, "loss": 0.3951, "learning_rate": 3.064748484562093e-05, "epoch": 0.23310810810810811, "percentage": 5.83, "elapsed_time": "0:06:01", "remaining_time": "1:37:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 1184, "loss": 0.3759, "learning_rate": 3.0751634000237615e-05, "epoch": 0.23648648648648649, "percentage": 5.91, "elapsed_time": "0:06:06", "remaining_time": "1:37:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 71, "total_steps": 1184, "loss": 0.409, "learning_rate": 3.085430581198459e-05, "epoch": 0.23986486486486486, "percentage": 6.0, "elapsed_time": "0:06:11", "remaining_time": "1:37:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 72, "total_steps": 1184, "loss": 0.3938, "learning_rate": 3.095554160718781e-05, "epoch": 0.24324324324324326, "percentage": 6.08, "elapsed_time": "0:06:17", "remaining_time": "1:37:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 73, "total_steps": 1184, "loss": 0.3657, "learning_rate": 3.10553810020076e-05, "epoch": 0.24662162162162163, "percentage": 6.17, "elapsed_time": "0:06:22", "remaining_time": "1:36:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 74, "total_steps": 1184, "loss": 0.3743, "learning_rate": 3.115386199551628e-05, "epoch": 0.25, "percentage": 6.25, "elapsed_time": "0:06:27", "remaining_time": "1:36:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 75, "total_steps": 1184, "loss": 0.3188, "learning_rate": 3.1251021056528336e-05, "epoch": 0.2533783783783784, "percentage": 6.33, "elapsed_time": "0:06:32", "remaining_time": "1:36:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 76, "total_steps": 1184, "loss": 0.3622, "learning_rate": 3.134689320467986e-05, "epoch": 0.25675675675675674, "percentage": 6.42, "elapsed_time": "0:06:37", "remaining_time": "1:36:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 77, "total_steps": 1184, "loss": 0.3768, "learning_rate": 3.144151208620804e-05, "epoch": 0.26013513513513514, "percentage": 6.5, "elapsed_time": "0:06:42", "remaining_time": "1:36:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 78, "total_steps": 1184, "loss": 0.3655, "learning_rate": 3.1534910044841344e-05, "epoch": 0.2635135135135135, "percentage": 6.59, "elapsed_time": "0:06:47", "remaining_time": "1:36:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 79, "total_steps": 1184, "loss": 0.358, "learning_rate": 3.1627118188174024e-05, "epoch": 0.2668918918918919, "percentage": 6.67, "elapsed_time": "0:06:53", "remaining_time": "1:36:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 80, "total_steps": 1184, "loss": 0.3579, "learning_rate": 3.171816644986573e-05, "epoch": 0.2702702702702703, "percentage": 6.76, "elapsed_time": "0:06:58", "remaining_time": "1:36:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 81, "total_steps": 1184, "loss": 0.3916, "learning_rate": 3.18080836479775e-05, "epoch": 0.27364864864864863, "percentage": 6.84, "elapsed_time": "0:07:03", "remaining_time": "1:36:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 82, "total_steps": 1184, "loss": 0.3768, "learning_rate": 3.1896897539728616e-05, "epoch": 0.27702702702702703, "percentage": 6.93, "elapsed_time": "0:07:08", "remaining_time": "1:35:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 83, "total_steps": 1184, "loss": 0.3709, "learning_rate": 3.198463487293457e-05, "epoch": 0.28040540540540543, "percentage": 7.01, "elapsed_time": "0:07:13", "remaining_time": "1:35:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 84, "total_steps": 1184, "loss": 0.3871, "learning_rate": 3.207132143436469e-05, "epoch": 0.28378378378378377, "percentage": 7.09, "elapsed_time": "0:07:18", "remaining_time": "1:35:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 85, "total_steps": 1184, "loss": 0.3632, "learning_rate": 3.215698209523821e-05, "epoch": 0.28716216216216217, "percentage": 7.18, "elapsed_time": "0:07:23", "remaining_time": "1:35:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 86, "total_steps": 1184, "loss": 0.3788, "learning_rate": 3.224164085405946e-05, "epoch": 0.2905405405405405, "percentage": 7.26, "elapsed_time": "0:07:28", "remaining_time": "1:35:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 87, "total_steps": 1184, "loss": 0.3472, "learning_rate": 3.232532087697698e-05, "epoch": 0.2939189189189189, "percentage": 7.35, "elapsed_time": "0:07:34", "remaining_time": "1:35:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 88, "total_steps": 1184, "loss": 0.3815, "learning_rate": 3.240804453583615e-05, "epoch": 0.2972972972972973, "percentage": 7.43, "elapsed_time": "0:07:39", "remaining_time": "1:35:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 89, "total_steps": 1184, "loss": 0.3374, "learning_rate": 3.248983344408188e-05, "epoch": 0.30067567567567566, "percentage": 7.52, "elapsed_time": "0:07:44", "remaining_time": "1:35:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 90, "total_steps": 1184, "loss": 0.3503, "learning_rate": 3.2570708490655414e-05, "epoch": 0.30405405405405406, "percentage": 7.6, "elapsed_time": "0:07:49", "remaining_time": "1:35:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 91, "total_steps": 1184, "loss": 0.3699, "learning_rate": 3.265068987201822e-05, "epoch": 0.30743243243243246, "percentage": 7.69, "elapsed_time": "0:07:54", "remaining_time": "1:34:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 92, "total_steps": 1184, "loss": 0.3702, "learning_rate": 3.2729797122425925e-05, "epoch": 0.3108108108108108, "percentage": 7.77, "elapsed_time": "0:07:59", "remaining_time": "1:34:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 93, "total_steps": 1184, "loss": 0.333, "learning_rate": 3.280804914256559e-05, "epoch": 0.3141891891891892, "percentage": 7.85, "elapsed_time": "0:08:04", "remaining_time": "1:34:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 94, "total_steps": 1184, "loss": 0.329, "learning_rate": 3.288546422666164e-05, "epoch": 0.31756756756756754, "percentage": 7.94, "elapsed_time": "0:08:09", "remaining_time": "1:34:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 95, "total_steps": 1184, "loss": 0.3931, "learning_rate": 3.2962060088147464e-05, "epoch": 0.32094594594594594, "percentage": 8.02, "elapsed_time": "0:08:15", "remaining_time": "1:34:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 96, "total_steps": 1184, "loss": 0.3432, "learning_rate": 3.3037853883992805e-05, "epoch": 0.32432432432432434, "percentage": 8.11, "elapsed_time": "0:08:20", "remaining_time": "1:34:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 97, "total_steps": 1184, "loss": 0.3508, "learning_rate": 3.3112862237770756e-05, "epoch": 0.3277027027027027, "percentage": 8.19, "elapsed_time": "0:08:25", "remaining_time": "1:34:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 98, "total_steps": 1184, "loss": 0.372, "learning_rate": 3.3187101261541584e-05, "epoch": 0.3310810810810811, "percentage": 8.28, "elapsed_time": "0:08:30", "remaining_time": "1:34:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 99, "total_steps": 1184, "loss": 0.3832, "learning_rate": 3.326058657662584e-05, "epoch": 0.3344594594594595, "percentage": 8.36, "elapsed_time": "0:08:35", "remaining_time": "1:34:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 1184, "loss": 0.3553, "learning_rate": 3.333333333333334e-05, "epoch": 0.33783783783783783, "percentage": 8.45, "elapsed_time": "0:08:40", "remaining_time": "1:34:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 101, "total_steps": 1184, "loss": 0.3448, "learning_rate": 3.340535622971072e-05, "epoch": 0.34121621621621623, "percentage": 8.53, "elapsed_time": "0:08:45", "remaining_time": "1:33:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 102, "total_steps": 1184, "loss": 0.3367, "learning_rate": 3.3476669529365295e-05, "epoch": 0.34459459459459457, "percentage": 8.61, "elapsed_time": "0:08:50", "remaining_time": "1:33:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 103, "total_steps": 1184, "loss": 0.3786, "learning_rate": 3.3547287078419544e-05, "epoch": 0.34797297297297297, "percentage": 8.7, "elapsed_time": "0:08:56", "remaining_time": "1:33:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 104, "total_steps": 1184, "loss": 0.352, "learning_rate": 3.361722232164634e-05, "epoch": 0.35135135135135137, "percentage": 8.78, "elapsed_time": "0:09:01", "remaining_time": "1:33:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 105, "total_steps": 1184, "loss": 0.3473, "learning_rate": 3.3686488317832306e-05, "epoch": 0.3547297297297297, "percentage": 8.87, "elapsed_time": "0:09:06", "remaining_time": "1:33:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 106, "total_steps": 1184, "loss": 0.2945, "learning_rate": 3.375509775441284e-05, "epoch": 0.3581081081081081, "percentage": 8.95, "elapsed_time": "0:09:11", "remaining_time": "1:33:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 107, "total_steps": 1184, "loss": 0.313, "learning_rate": 3.382306296142016e-05, "epoch": 0.3614864864864865, "percentage": 9.04, "elapsed_time": "0:09:16", "remaining_time": "1:33:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 108, "total_steps": 1184, "loss": 0.3367, "learning_rate": 3.38903959247825e-05, "epoch": 0.36486486486486486, "percentage": 9.12, "elapsed_time": "0:09:21", "remaining_time": "1:33:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 109, "total_steps": 1184, "loss": 0.3639, "learning_rate": 3.395710829901039e-05, "epoch": 0.36824324324324326, "percentage": 9.21, "elapsed_time": "0:09:26", "remaining_time": "1:33:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 110, "total_steps": 1184, "loss": 0.3523, "learning_rate": 3.402321141930376e-05, "epoch": 0.3716216216216216, "percentage": 9.29, "elapsed_time": "0:09:31", "remaining_time": "1:33:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 111, "total_steps": 1184, "loss": 0.3418, "learning_rate": 3.4088716313110955e-05, "epoch": 0.375, "percentage": 9.38, "elapsed_time": "0:09:37", "remaining_time": "1:32:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 112, "total_steps": 1184, "loss": 0.3208, "learning_rate": 3.415363371116969e-05, "epoch": 0.3783783783783784, "percentage": 9.46, "elapsed_time": "0:09:42", "remaining_time": "1:32:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 113, "total_steps": 1184, "loss": 0.3412, "learning_rate": 3.4217974058057e-05, "epoch": 0.38175675675675674, "percentage": 9.54, "elapsed_time": "0:09:47", "remaining_time": "1:32:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 114, "total_steps": 1184, "loss": 0.3615, "learning_rate": 3.428174752227455e-05, "epoch": 0.38513513513513514, "percentage": 9.63, "elapsed_time": "0:09:52", "remaining_time": "1:32:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 115, "total_steps": 1184, "loss": 0.3171, "learning_rate": 3.434496400589353e-05, "epoch": 0.3885135135135135, "percentage": 9.71, "elapsed_time": "0:09:57", "remaining_time": "1:32:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 116, "total_steps": 1184, "loss": 0.315, "learning_rate": 3.440763315378198e-05, "epoch": 0.3918918918918919, "percentage": 9.8, "elapsed_time": "0:10:02", "remaining_time": "1:32:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 117, "total_steps": 1184, "loss": 0.3117, "learning_rate": 3.446976436243603e-05, "epoch": 0.3952702702702703, "percentage": 9.88, "elapsed_time": "0:10:07", "remaining_time": "1:32:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 118, "total_steps": 1184, "loss": 0.3192, "learning_rate": 3.4531366788435425e-05, "epoch": 0.39864864864864863, "percentage": 9.97, "elapsed_time": "0:10:12", "remaining_time": "1:32:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 119, "total_steps": 1184, "loss": 0.3353, "learning_rate": 3.459244935654219e-05, "epoch": 0.40202702702702703, "percentage": 10.05, "elapsed_time": "0:10:18", "remaining_time": "1:32:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 120, "total_steps": 1184, "loss": 0.3572, "learning_rate": 3.465302076746041e-05, "epoch": 0.40540540540540543, "percentage": 10.14, "elapsed_time": "0:10:23", "remaining_time": "1:32:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 121, "total_steps": 1184, "loss": 0.3217, "learning_rate": 3.471308950527417e-05, "epoch": 0.40878378378378377, "percentage": 10.22, "elapsed_time": "0:10:28", "remaining_time": "1:32:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 122, "total_steps": 1184, "loss": 0.3214, "learning_rate": 3.477266384457914e-05, "epoch": 0.41216216216216217, "percentage": 10.3, "elapsed_time": "0:10:33", "remaining_time": "1:31:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 123, "total_steps": 1184, "loss": 0.3332, "learning_rate": 3.48317518573233e-05, "epoch": 0.4155405405405405, "percentage": 10.39, "elapsed_time": "0:10:38", "remaining_time": "1:31:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 124, "total_steps": 1184, "loss": 0.354, "learning_rate": 3.489036141937059e-05, "epoch": 0.4189189189189189, "percentage": 10.47, "elapsed_time": "0:10:43", "remaining_time": "1:31:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 125, "total_steps": 1184, "loss": 0.353, "learning_rate": 3.494850021680094e-05, "epoch": 0.4222972972972973, "percentage": 10.56, "elapsed_time": "0:10:48", "remaining_time": "1:31:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 126, "total_steps": 1184, "loss": 0.3065, "learning_rate": 3.500617575195938e-05, "epoch": 0.42567567567567566, "percentage": 10.64, "elapsed_time": "0:10:54", "remaining_time": "1:31:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 127, "total_steps": 1184, "loss": 0.3329, "learning_rate": 3.5063395349265945e-05, "epoch": 0.42905405405405406, "percentage": 10.73, "elapsed_time": "0:10:59", "remaining_time": "1:31:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 128, "total_steps": 1184, "loss": 0.3476, "learning_rate": 3.5120166160797804e-05, "epoch": 0.43243243243243246, "percentage": 10.81, "elapsed_time": "0:11:04", "remaining_time": "1:31:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 129, "total_steps": 1184, "loss": 0.3517, "learning_rate": 3.517649517165415e-05, "epoch": 0.4358108108108108, "percentage": 10.9, "elapsed_time": "0:11:09", "remaining_time": "1:31:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 130, "total_steps": 1184, "loss": 0.3417, "learning_rate": 3.523238920511395e-05, "epoch": 0.4391891891891892, "percentage": 10.98, "elapsed_time": "0:11:14", "remaining_time": "1:31:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 131, "total_steps": 1184, "loss": 0.3543, "learning_rate": 3.528785492759607e-05, "epoch": 0.44256756756756754, "percentage": 11.06, "elapsed_time": "0:11:19", "remaining_time": "1:31:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 132, "total_steps": 1184, "loss": 0.3552, "learning_rate": 3.5342898853430836e-05, "epoch": 0.44594594594594594, "percentage": 11.15, "elapsed_time": "0:11:24", "remaining_time": "1:30:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 133, "total_steps": 1184, "loss": 0.3469, "learning_rate": 3.539752734945143e-05, "epoch": 0.44932432432432434, "percentage": 11.23, "elapsed_time": "0:11:29", "remaining_time": "1:30:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 134, "total_steps": 1184, "loss": 0.294, "learning_rate": 3.5451746639413466e-05, "epoch": 0.4527027027027027, "percentage": 11.32, "elapsed_time": "0:11:35", "remaining_time": "1:30:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 135, "total_steps": 1184, "loss": 0.2557, "learning_rate": 3.550556280825011e-05, "epoch": 0.4560810810810811, "percentage": 11.4, "elapsed_time": "0:11:40", "remaining_time": "1:30:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 136, "total_steps": 1184, "loss": 0.2885, "learning_rate": 3.55589818061703e-05, "epoch": 0.4594594594594595, "percentage": 11.49, "elapsed_time": "0:11:45", "remaining_time": "1:30:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 137, "total_steps": 1184, "loss": 0.3436, "learning_rate": 3.561200945260678e-05, "epoch": 0.46283783783783783, "percentage": 11.57, "elapsed_time": "0:11:50", "remaining_time": "1:30:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 138, "total_steps": 1184, "loss": 0.2865, "learning_rate": 3.5664651440020616e-05, "epoch": 0.46621621621621623, "percentage": 11.66, "elapsed_time": "0:11:55", "remaining_time": "1:30:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 139, "total_steps": 1184, "loss": 0.3394, "learning_rate": 3.571691333756825e-05, "epoch": 0.46959459459459457, "percentage": 11.74, "elapsed_time": "0:12:00", "remaining_time": "1:30:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 1184, "loss": 0.3278, "learning_rate": 3.5768800594637304e-05, "epoch": 0.47297297297297297, "percentage": 11.82, "elapsed_time": "0:12:05", "remaining_time": "1:30:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 141, "total_steps": 1184, "loss": 0.3343, "learning_rate": 3.582031854425634e-05, "epoch": 0.47635135135135137, "percentage": 11.91, "elapsed_time": "0:12:11", "remaining_time": "1:30:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 142, "total_steps": 1184, "loss": 0.3079, "learning_rate": 3.587147240638428e-05, "epoch": 0.4797297297297297, "percentage": 11.99, "elapsed_time": "0:12:16", "remaining_time": "1:30:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 143, "total_steps": 1184, "loss": 0.3305, "learning_rate": 3.5922267291084366e-05, "epoch": 0.4831081081081081, "percentage": 12.08, "elapsed_time": "0:12:21", "remaining_time": "1:29:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 144, "total_steps": 1184, "loss": 0.3242, "learning_rate": 3.5972708201587496e-05, "epoch": 0.4864864864864865, "percentage": 12.16, "elapsed_time": "0:12:26", "remaining_time": "1:29:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 145, "total_steps": 1184, "loss": 0.3341, "learning_rate": 3.6022800037249585e-05, "epoch": 0.48986486486486486, "percentage": 12.25, "elapsed_time": "0:12:31", "remaining_time": "1:29:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 146, "total_steps": 1184, "loss": 0.31, "learning_rate": 3.607254759640729e-05, "epoch": 0.49324324324324326, "percentage": 12.33, "elapsed_time": "0:12:36", "remaining_time": "1:29:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 147, "total_steps": 1184, "loss": 0.3048, "learning_rate": 3.612195557913627e-05, "epoch": 0.4966216216216216, "percentage": 12.42, "elapsed_time": "0:12:41", "remaining_time": "1:29:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 148, "total_steps": 1184, "loss": 0.3266, "learning_rate": 3.6171028589915954e-05, "epoch": 0.5, "percentage": 12.5, "elapsed_time": "0:12:46", "remaining_time": "1:29:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 149, "total_steps": 1184, "loss": 0.3509, "learning_rate": 3.6219771140204575e-05, "epoch": 0.5033783783783784, "percentage": 12.58, "elapsed_time": "0:12:52", "remaining_time": "1:29:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 1184, "loss": 0.3348, "learning_rate": 3.626818765092802e-05, "epoch": 0.5067567567567568, "percentage": 12.67, "elapsed_time": "0:12:57", "remaining_time": "1:29:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 151, "total_steps": 1184, "loss": 0.3218, "learning_rate": 3.6316282454886157e-05, "epoch": 0.5101351351351351, "percentage": 12.75, "elapsed_time": "0:13:02", "remaining_time": "1:29:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 152, "total_steps": 1184, "loss": 0.347, "learning_rate": 3.636405979907955e-05, "epoch": 0.5135135135135135, "percentage": 12.84, "elapsed_time": "0:13:07", "remaining_time": "1:29:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 153, "total_steps": 1184, "loss": 0.2618, "learning_rate": 3.6411523846959985e-05, "epoch": 0.5168918918918919, "percentage": 12.92, "elapsed_time": "0:13:12", "remaining_time": "1:29:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 154, "total_steps": 1184, "loss": 0.3364, "learning_rate": 3.645867868060772e-05, "epoch": 0.5202702702702703, "percentage": 13.01, "elapsed_time": "0:13:17", "remaining_time": "1:28:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 155, "total_steps": 1184, "loss": 0.327, "learning_rate": 3.6505528302838193e-05, "epoch": 0.5236486486486487, "percentage": 13.09, "elapsed_time": "0:13:22", "remaining_time": "1:28:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 156, "total_steps": 1184, "loss": 0.3008, "learning_rate": 3.6552076639241027e-05, "epoch": 0.527027027027027, "percentage": 13.18, "elapsed_time": "0:13:27", "remaining_time": "1:28:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 157, "total_steps": 1184, "loss": 0.3153, "learning_rate": 3.65983275401539e-05, "epoch": 0.5304054054054054, "percentage": 13.26, "elapsed_time": "0:13:33", "remaining_time": "1:28:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 158, "total_steps": 1184, "loss": 0.3409, "learning_rate": 3.664428478257371e-05, "epoch": 0.5337837837837838, "percentage": 13.34, "elapsed_time": "0:13:38", "remaining_time": "1:28:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 159, "total_steps": 1184, "loss": 0.3295, "learning_rate": 3.668995207200753e-05, "epoch": 0.5371621621621622, "percentage": 13.43, "elapsed_time": "0:13:43", "remaining_time": "1:28:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 160, "total_steps": 1184, "loss": 0.3522, "learning_rate": 3.673533304426541e-05, "epoch": 0.5405405405405406, "percentage": 13.51, "elapsed_time": "0:13:48", "remaining_time": "1:28:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 161, "total_steps": 1184, "loss": 0.3322, "learning_rate": 3.67804312671975e-05, "epoch": 0.543918918918919, "percentage": 13.6, "elapsed_time": "0:13:53", "remaining_time": "1:28:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 162, "total_steps": 1184, "loss": 0.3283, "learning_rate": 3.682525024237719e-05, "epoch": 0.5472972972972973, "percentage": 13.68, "elapsed_time": "0:13:58", "remaining_time": "1:28:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 163, "total_steps": 1184, "loss": 0.3104, "learning_rate": 3.6869793406732636e-05, "epoch": 0.5506756756756757, "percentage": 13.77, "elapsed_time": "0:14:03", "remaining_time": "1:28:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 164, "total_steps": 1184, "loss": 0.3292, "learning_rate": 3.69140641341283e-05, "epoch": 0.5540540540540541, "percentage": 13.85, "elapsed_time": "0:14:09", "remaining_time": "1:28:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 165, "total_steps": 1184, "loss": 0.3183, "learning_rate": 3.695806573689844e-05, "epoch": 0.5574324324324325, "percentage": 13.94, "elapsed_time": "0:14:14", "remaining_time": "1:27:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 166, "total_steps": 1184, "loss": 0.2935, "learning_rate": 3.700180146733426e-05, "epoch": 0.5608108108108109, "percentage": 14.02, "elapsed_time": "0:14:19", "remaining_time": "1:27:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 167, "total_steps": 1184, "loss": 0.3249, "learning_rate": 3.704527451912639e-05, "epoch": 0.5641891891891891, "percentage": 14.1, "elapsed_time": "0:14:24", "remaining_time": "1:27:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 168, "total_steps": 1184, "loss": 0.3128, "learning_rate": 3.708848802876438e-05, "epoch": 0.5675675675675675, "percentage": 14.19, "elapsed_time": "0:14:29", "remaining_time": "1:27:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 169, "total_steps": 1184, "loss": 0.2882, "learning_rate": 3.7131445076894564e-05, "epoch": 0.5709459459459459, "percentage": 14.27, "elapsed_time": "0:14:34", "remaining_time": "1:27:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 170, "total_steps": 1184, "loss": 0.3268, "learning_rate": 3.717414868963791e-05, "epoch": 0.5743243243243243, "percentage": 14.36, "elapsed_time": "0:14:39", "remaining_time": "1:27:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 171, "total_steps": 1184, "loss": 0.3161, "learning_rate": 3.721660183986924e-05, "epoch": 0.5777027027027027, "percentage": 14.44, "elapsed_time": "0:14:44", "remaining_time": "1:27:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 172, "total_steps": 1184, "loss": 0.2942, "learning_rate": 3.725880744845915e-05, "epoch": 0.581081081081081, "percentage": 14.53, "elapsed_time": "0:14:50", "remaining_time": "1:27:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 173, "total_steps": 1184, "loss": 0.3232, "learning_rate": 3.730076838547993e-05, "epoch": 0.5844594594594594, "percentage": 14.61, "elapsed_time": "0:14:55", "remaining_time": "1:27:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 174, "total_steps": 1184, "loss": 0.3115, "learning_rate": 3.734248747137666e-05, "epoch": 0.5878378378378378, "percentage": 14.7, "elapsed_time": "0:15:00", "remaining_time": "1:27:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 175, "total_steps": 1184, "loss": 0.3245, "learning_rate": 3.738396747810492e-05, "epoch": 0.5912162162162162, "percentage": 14.78, "elapsed_time": "0:15:05", "remaining_time": "1:27:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 176, "total_steps": 1184, "loss": 0.3152, "learning_rate": 3.7425211130235834e-05, "epoch": 0.5945945945945946, "percentage": 14.86, "elapsed_time": "0:15:10", "remaining_time": "1:26:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 177, "total_steps": 1184, "loss": 0.3115, "learning_rate": 3.7466221106030115e-05, "epoch": 0.597972972972973, "percentage": 14.95, "elapsed_time": "0:15:15", "remaining_time": "1:26:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 178, "total_steps": 1184, "loss": 0.2948, "learning_rate": 3.750700003848157e-05, "epoch": 0.6013513513513513, "percentage": 15.03, "elapsed_time": "0:15:20", "remaining_time": "1:26:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 179, "total_steps": 1184, "loss": 0.337, "learning_rate": 3.7547550516331555e-05, "epoch": 0.6047297297297297, "percentage": 15.12, "elapsed_time": "0:15:25", "remaining_time": "1:26:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 180, "total_steps": 1184, "loss": 0.3244, "learning_rate": 3.75878750850551e-05, "epoch": 0.6081081081081081, "percentage": 15.2, "elapsed_time": "0:15:31", "remaining_time": "1:26:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 181, "total_steps": 1184, "loss": 0.3173, "learning_rate": 3.7627976247819744e-05, "epoch": 0.6114864864864865, "percentage": 15.29, "elapsed_time": "0:15:36", "remaining_time": "1:26:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 182, "total_steps": 1184, "loss": 0.3087, "learning_rate": 3.766785646641792e-05, "epoch": 0.6148648648648649, "percentage": 15.37, "elapsed_time": "0:15:41", "remaining_time": "1:26:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 183, "total_steps": 1184, "loss": 0.3261, "learning_rate": 3.770751816217383e-05, "epoch": 0.6182432432432432, "percentage": 15.46, "elapsed_time": "0:15:46", "remaining_time": "1:26:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 184, "total_steps": 1184, "loss": 0.3239, "learning_rate": 3.7746963716825615e-05, "epoch": 0.6216216216216216, "percentage": 15.54, "elapsed_time": "0:15:51", "remaining_time": "1:26:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 185, "total_steps": 1184, "loss": 0.3082, "learning_rate": 3.778619547338356e-05, "epoch": 0.625, "percentage": 15.62, "elapsed_time": "0:15:56", "remaining_time": "1:26:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 186, "total_steps": 1184, "loss": 0.2753, "learning_rate": 3.782521573696528e-05, "epoch": 0.6283783783783784, "percentage": 15.71, "elapsed_time": "0:16:01", "remaining_time": "1:26:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 187, "total_steps": 1184, "loss": 0.3033, "learning_rate": 3.786402677560832e-05, "epoch": 0.6317567567567568, "percentage": 15.79, "elapsed_time": "0:16:07", "remaining_time": "1:25:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 188, "total_steps": 1184, "loss": 0.3171, "learning_rate": 3.790263082106134e-05, "epoch": 0.6351351351351351, "percentage": 15.88, "elapsed_time": "0:16:12", "remaining_time": "1:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 189, "total_steps": 1184, "loss": 0.2927, "learning_rate": 3.794103006955407e-05, "epoch": 0.6385135135135135, "percentage": 15.96, "elapsed_time": "0:16:17", "remaining_time": "1:25:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 190, "total_steps": 1184, "loss": 0.2885, "learning_rate": 3.797922668254715e-05, "epoch": 0.6418918918918919, "percentage": 16.05, "elapsed_time": "0:16:22", "remaining_time": "1:25:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 191, "total_steps": 1184, "loss": 0.3379, "learning_rate": 3.801722278746213e-05, "epoch": 0.6452702702702703, "percentage": 16.13, "elapsed_time": "0:16:27", "remaining_time": "1:25:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 192, "total_steps": 1184, "loss": 0.3091, "learning_rate": 3.8055020478392495e-05, "epoch": 0.6486486486486487, "percentage": 16.22, "elapsed_time": "0:16:32", "remaining_time": "1:25:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 193, "total_steps": 1184, "loss": 0.3758, "learning_rate": 3.809262181679623e-05, "epoch": 0.652027027027027, "percentage": 16.3, "elapsed_time": "0:16:37", "remaining_time": "1:25:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 194, "total_steps": 1184, "loss": 0.3044, "learning_rate": 3.813002883217044e-05, "epoch": 0.6554054054054054, "percentage": 16.39, "elapsed_time": "0:16:42", "remaining_time": "1:25:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 195, "total_steps": 1184, "loss": 0.3556, "learning_rate": 3.816724352270863e-05, "epoch": 0.6587837837837838, "percentage": 16.47, "elapsed_time": "0:16:48", "remaining_time": "1:25:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 196, "total_steps": 1184, "loss": 0.3352, "learning_rate": 3.8204267855941266e-05, "epoch": 0.6621621621621622, "percentage": 16.55, "elapsed_time": "0:16:53", "remaining_time": "1:25:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 197, "total_steps": 1184, "loss": 0.3328, "learning_rate": 3.824110376935989e-05, "epoch": 0.6655405405405406, "percentage": 16.64, "elapsed_time": "0:16:58", "remaining_time": "1:25:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 198, "total_steps": 1184, "loss": 0.296, "learning_rate": 3.827775317102552e-05, "epoch": 0.668918918918919, "percentage": 16.72, "elapsed_time": "0:17:03", "remaining_time": "1:24:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 199, "total_steps": 1184, "loss": 0.3049, "learning_rate": 3.831421794016178e-05, "epoch": 0.6722972972972973, "percentage": 16.81, "elapsed_time": "0:17:08", "remaining_time": "1:24:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 1184, "loss": 0.3133, "learning_rate": 3.835049992773302e-05, "epoch": 0.6756756756756757, "percentage": 16.89, "elapsed_time": "0:17:13", "remaining_time": "1:24:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 201, "total_steps": 1184, "loss": 0.3185, "learning_rate": 3.838660095700815e-05, "epoch": 0.6790540540540541, "percentage": 16.98, "elapsed_time": "0:17:18", "remaining_time": "1:24:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 202, "total_steps": 1184, "loss": 0.302, "learning_rate": 3.84225228241104e-05, "epoch": 0.6824324324324325, "percentage": 17.06, "elapsed_time": "0:17:23", "remaining_time": "1:24:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 203, "total_steps": 1184, "loss": 0.3407, "learning_rate": 3.8458267298553554e-05, "epoch": 0.6858108108108109, "percentage": 17.15, "elapsed_time": "0:17:29", "remaining_time": "1:24:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 204, "total_steps": 1184, "loss": 0.2858, "learning_rate": 3.8493836123764984e-05, "epoch": 0.6891891891891891, "percentage": 17.23, "elapsed_time": "0:17:34", "remaining_time": "1:24:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 205, "total_steps": 1184, "loss": 0.3638, "learning_rate": 3.852923101759591e-05, "epoch": 0.6925675675675675, "percentage": 17.31, "elapsed_time": "0:17:39", "remaining_time": "1:24:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 206, "total_steps": 1184, "loss": 0.3077, "learning_rate": 3.856445367281923e-05, "epoch": 0.6959459459459459, "percentage": 17.4, "elapsed_time": "0:17:44", "remaining_time": "1:24:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 207, "total_steps": 1184, "loss": 0.2791, "learning_rate": 3.859950575761529e-05, "epoch": 0.6993243243243243, "percentage": 17.48, "elapsed_time": "0:17:49", "remaining_time": "1:24:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 208, "total_steps": 1184, "loss": 0.3404, "learning_rate": 3.8634388916046025e-05, "epoch": 0.7027027027027027, "percentage": 17.57, "elapsed_time": "0:17:54", "remaining_time": "1:24:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 209, "total_steps": 1184, "loss": 0.2859, "learning_rate": 3.866910476851757e-05, "epoch": 0.706081081081081, "percentage": 17.65, "elapsed_time": "0:17:59", "remaining_time": "1:23:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 1184, "loss": 0.3224, "learning_rate": 3.870365491223199e-05, "epoch": 0.7094594594594594, "percentage": 17.74, "elapsed_time": "0:18:04", "remaining_time": "1:23:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 211, "total_steps": 1184, "loss": 0.3225, "learning_rate": 3.8738040921628215e-05, "epoch": 0.7128378378378378, "percentage": 17.82, "elapsed_time": "0:18:10", "remaining_time": "1:23:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 212, "total_steps": 1184, "loss": 0.3294, "learning_rate": 3.877226434881253e-05, "epoch": 0.7162162162162162, "percentage": 17.91, "elapsed_time": "0:18:15", "remaining_time": "1:23:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 213, "total_steps": 1184, "loss": 0.3035, "learning_rate": 3.880632672397897e-05, "epoch": 0.7195945945945946, "percentage": 17.99, "elapsed_time": "0:18:20", "remaining_time": "1:23:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 214, "total_steps": 1184, "loss": 0.3261, "learning_rate": 3.884022955581985e-05, "epoch": 0.722972972972973, "percentage": 18.07, "elapsed_time": "0:18:25", "remaining_time": "1:23:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 215, "total_steps": 1184, "loss": 0.2926, "learning_rate": 3.887397433192676e-05, "epoch": 0.7263513513513513, "percentage": 18.16, "elapsed_time": "0:18:30", "remaining_time": "1:23:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 216, "total_steps": 1184, "loss": 0.2808, "learning_rate": 3.890756251918219e-05, "epoch": 0.7297297297297297, "percentage": 18.24, "elapsed_time": "0:18:35", "remaining_time": "1:23:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 217, "total_steps": 1184, "loss": 0.2995, "learning_rate": 3.894099556414216e-05, "epoch": 0.7331081081081081, "percentage": 18.33, "elapsed_time": "0:18:40", "remaining_time": "1:23:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 218, "total_steps": 1184, "loss": 0.3054, "learning_rate": 3.897427489341009e-05, "epoch": 0.7364864864864865, "percentage": 18.41, "elapsed_time": "0:18:46", "remaining_time": "1:23:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 219, "total_steps": 1184, "loss": 0.3239, "learning_rate": 3.900740191400198e-05, "epoch": 0.7398648648648649, "percentage": 18.5, "elapsed_time": "0:18:51", "remaining_time": "1:23:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 220, "total_steps": 1184, "loss": 0.3215, "learning_rate": 3.904037801370344e-05, "epoch": 0.7432432432432432, "percentage": 18.58, "elapsed_time": "0:18:56", "remaining_time": "1:22:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 221, "total_steps": 1184, "loss": 0.2829, "learning_rate": 3.9073204561418514e-05, "epoch": 0.7466216216216216, "percentage": 18.67, "elapsed_time": "0:19:01", "remaining_time": "1:22:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 222, "total_steps": 1184, "loss": 0.3052, "learning_rate": 3.9105882907510644e-05, "epoch": 0.75, "percentage": 18.75, "elapsed_time": "0:19:06", "remaining_time": "1:22:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 223, "total_steps": 1184, "loss": 0.3259, "learning_rate": 3.913841438413601e-05, "epoch": 0.7533783783783784, "percentage": 18.83, "elapsed_time": "0:19:11", "remaining_time": "1:22:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 224, "total_steps": 1184, "loss": 0.3252, "learning_rate": 3.917080030556938e-05, "epoch": 0.7567567567567568, "percentage": 18.92, "elapsed_time": "0:19:16", "remaining_time": "1:22:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 225, "total_steps": 1184, "loss": 0.3252, "learning_rate": 3.9203041968522716e-05, "epoch": 0.7601351351351351, "percentage": 19.0, "elapsed_time": "0:19:21", "remaining_time": "1:22:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 226, "total_steps": 1184, "loss": 0.3185, "learning_rate": 3.923514065245669e-05, "epoch": 0.7635135135135135, "percentage": 19.09, "elapsed_time": "0:19:27", "remaining_time": "1:22:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 227, "total_steps": 1184, "loss": 0.3136, "learning_rate": 3.926709761988538e-05, "epoch": 0.7668918918918919, "percentage": 19.17, "elapsed_time": "0:19:32", "remaining_time": "1:22:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 228, "total_steps": 1184, "loss": 0.2977, "learning_rate": 3.929891411667424e-05, "epoch": 0.7702702702702703, "percentage": 19.26, "elapsed_time": "0:19:37", "remaining_time": "1:22:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 229, "total_steps": 1184, "loss": 0.3031, "learning_rate": 3.933059137233147e-05, "epoch": 0.7736486486486487, "percentage": 19.34, "elapsed_time": "0:19:42", "remaining_time": "1:22:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 230, "total_steps": 1184, "loss": 0.3292, "learning_rate": 3.9362130600293214e-05, "epoch": 0.777027027027027, "percentage": 19.43, "elapsed_time": "0:19:47", "remaining_time": "1:22:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 231, "total_steps": 1184, "loss": 0.3014, "learning_rate": 3.9393532998202405e-05, "epoch": 0.7804054054054054, "percentage": 19.51, "elapsed_time": "0:19:52", "remaining_time": "1:22:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 232, "total_steps": 1184, "loss": 0.2804, "learning_rate": 3.942479974818166e-05, "epoch": 0.7837837837837838, "percentage": 19.59, "elapsed_time": "0:19:57", "remaining_time": "1:21:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 233, "total_steps": 1184, "loss": 0.3243, "learning_rate": 3.945593201710032e-05, "epoch": 0.7871621621621622, "percentage": 19.68, "elapsed_time": "0:20:02", "remaining_time": "1:21:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 234, "total_steps": 1184, "loss": 0.2907, "learning_rate": 3.9486930956835724e-05, "epoch": 0.7905405405405406, "percentage": 19.76, "elapsed_time": "0:20:08", "remaining_time": "1:21:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 235, "total_steps": 1184, "loss": 0.3265, "learning_rate": 3.951779770452894e-05, "epoch": 0.793918918918919, "percentage": 19.85, "elapsed_time": "0:20:13", "remaining_time": "1:21:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 236, "total_steps": 1184, "loss": 0.3194, "learning_rate": 3.954853338283512e-05, "epoch": 0.7972972972972973, "percentage": 19.93, "elapsed_time": "0:20:18", "remaining_time": "1:21:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 237, "total_steps": 1184, "loss": 0.2857, "learning_rate": 3.9579139100168404e-05, "epoch": 0.8006756756756757, "percentage": 20.02, "elapsed_time": "0:20:23", "remaining_time": "1:21:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 238, "total_steps": 1184, "loss": 0.2843, "learning_rate": 3.960961595094187e-05, "epoch": 0.8040540540540541, "percentage": 20.1, "elapsed_time": "0:20:28", "remaining_time": "1:21:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 239, "total_steps": 1184, "loss": 0.2755, "learning_rate": 3.96399650158023e-05, "epoch": 0.8074324324324325, "percentage": 20.19, "elapsed_time": "0:20:33", "remaining_time": "1:21:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 240, "total_steps": 1184, "loss": 0.3015, "learning_rate": 3.96701873618601e-05, "epoch": 0.8108108108108109, "percentage": 20.27, "elapsed_time": "0:20:38", "remaining_time": "1:21:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 241, "total_steps": 1184, "loss": 0.2911, "learning_rate": 3.970028404291448e-05, "epoch": 0.8141891891891891, "percentage": 20.35, "elapsed_time": "0:20:43", "remaining_time": "1:21:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 242, "total_steps": 1184, "loss": 0.3093, "learning_rate": 3.9730256099673865e-05, "epoch": 0.8175675675675675, "percentage": 20.44, "elapsed_time": "0:20:49", "remaining_time": "1:21:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 243, "total_steps": 1184, "loss": 0.3078, "learning_rate": 3.976010455997187e-05, "epoch": 0.8209459459459459, "percentage": 20.52, "elapsed_time": "0:20:54", "remaining_time": "1:20:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 244, "total_steps": 1184, "loss": 0.2723, "learning_rate": 3.978983043897883e-05, "epoch": 0.8243243243243243, "percentage": 20.61, "elapsed_time": "0:20:59", "remaining_time": "1:20:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 245, "total_steps": 1184, "loss": 0.3161, "learning_rate": 3.981943473940888e-05, "epoch": 0.8277027027027027, "percentage": 20.69, "elapsed_time": "0:21:04", "remaining_time": "1:20:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 246, "total_steps": 1184, "loss": 0.3002, "learning_rate": 3.984891845172299e-05, "epoch": 0.831081081081081, "percentage": 20.78, "elapsed_time": "0:21:09", "remaining_time": "1:20:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 247, "total_steps": 1184, "loss": 0.3614, "learning_rate": 3.987828255432777e-05, "epoch": 0.8344594594594594, "percentage": 20.86, "elapsed_time": "0:21:14", "remaining_time": "1:20:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 248, "total_steps": 1184, "loss": 0.3226, "learning_rate": 3.9907528013770276e-05, "epoch": 0.8378378378378378, "percentage": 20.95, "elapsed_time": "0:21:19", "remaining_time": "1:20:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 249, "total_steps": 1184, "loss": 0.289, "learning_rate": 3.993665578492894e-05, "epoch": 0.8412162162162162, "percentage": 21.03, "elapsed_time": "0:21:24", "remaining_time": "1:20:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 1184, "loss": 0.3346, "learning_rate": 3.9965666811200624e-05, "epoch": 0.8445945945945946, "percentage": 21.11, "elapsed_time": "0:21:30", "remaining_time": "1:20:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 251, "total_steps": 1184, "loss": 0.3526, "learning_rate": 3.999456202468397e-05, "epoch": 0.847972972972973, "percentage": 21.2, "elapsed_time": "0:35:19", "remaining_time": "2:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 252, "total_steps": 1184, "loss": 0.3086, "learning_rate": 4.002334234635907e-05, "epoch": 0.8513513513513513, "percentage": 21.28, "elapsed_time": "0:35:24", "remaining_time": "2:10:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 253, "total_steps": 1184, "loss": 0.3578, "learning_rate": 4.005200868626364e-05, "epoch": 0.8547297297297297, "percentage": 21.37, "elapsed_time": "0:35:29", "remaining_time": "2:10:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 254, "total_steps": 1184, "loss": 0.3166, "learning_rate": 4.008056194366564e-05, "epoch": 0.8581081081081081, "percentage": 21.45, "elapsed_time": "0:35:34", "remaining_time": "2:10:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 255, "total_steps": 1184, "loss": 0.2969, "learning_rate": 4.010900300723259e-05, "epoch": 0.8614864864864865, "percentage": 21.54, "elapsed_time": "0:35:39", "remaining_time": "2:09:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 256, "total_steps": 1184, "loss": 0.3341, "learning_rate": 4.013733275519749e-05, "epoch": 0.8648648648648649, "percentage": 21.62, "elapsed_time": "0:35:44", "remaining_time": "2:09:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 257, "total_steps": 1184, "loss": 0.2942, "learning_rate": 4.016555205552158e-05, "epoch": 0.8682432432432432, "percentage": 21.71, "elapsed_time": "0:35:49", "remaining_time": "2:09:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 258, "total_steps": 1184, "loss": 0.2668, "learning_rate": 4.0193661766053834e-05, "epoch": 0.8716216216216216, "percentage": 21.79, "elapsed_time": "0:35:54", "remaining_time": "2:08:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 259, "total_steps": 1184, "loss": 0.3424, "learning_rate": 4.022166273468753e-05, "epoch": 0.875, "percentage": 21.88, "elapsed_time": "0:35:59", "remaining_time": "2:08:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 260, "total_steps": 1184, "loss": 0.2906, "learning_rate": 4.024955579951363e-05, "epoch": 0.8783783783783784, "percentage": 21.96, "elapsed_time": "0:36:05", "remaining_time": "2:08:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 261, "total_steps": 1184, "loss": 0.3307, "learning_rate": 4.027734178897136e-05, "epoch": 0.8817567567567568, "percentage": 22.04, "elapsed_time": "0:36:10", "remaining_time": "2:07:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 262, "total_steps": 1184, "loss": 0.2569, "learning_rate": 4.030502152199576e-05, "epoch": 0.8851351351351351, "percentage": 22.13, "elapsed_time": "0:36:15", "remaining_time": "2:07:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 263, "total_steps": 1184, "loss": 0.2925, "learning_rate": 4.033259580816264e-05, "epoch": 0.8885135135135135, "percentage": 22.21, "elapsed_time": "0:36:20", "remaining_time": "2:07:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 264, "total_steps": 1184, "loss": 0.3058, "learning_rate": 4.036006544783052e-05, "epoch": 0.8918918918918919, "percentage": 22.3, "elapsed_time": "0:36:25", "remaining_time": "2:06:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 265, "total_steps": 1184, "loss": 0.2952, "learning_rate": 4.0387431232280135e-05, "epoch": 0.8952702702702703, "percentage": 22.38, "elapsed_time": "0:36:30", "remaining_time": "2:06:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 266, "total_steps": 1184, "loss": 0.2873, "learning_rate": 4.041469394385112e-05, "epoch": 0.8986486486486487, "percentage": 22.47, "elapsed_time": "0:36:35", "remaining_time": "2:06:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 267, "total_steps": 1184, "loss": 0.2747, "learning_rate": 4.0441854356076257e-05, "epoch": 0.902027027027027, "percentage": 22.55, "elapsed_time": "0:36:40", "remaining_time": "2:05:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 268, "total_steps": 1184, "loss": 0.3157, "learning_rate": 4.046891323381315e-05, "epoch": 0.9054054054054054, "percentage": 22.64, "elapsed_time": "0:36:45", "remaining_time": "2:05:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 269, "total_steps": 1184, "loss": 0.3139, "learning_rate": 4.049587133337347e-05, "epoch": 0.9087837837837838, "percentage": 22.72, "elapsed_time": "0:36:51", "remaining_time": "2:05:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 270, "total_steps": 1184, "loss": 0.3122, "learning_rate": 4.0522729402649793e-05, "epoch": 0.9121621621621622, "percentage": 22.8, "elapsed_time": "0:36:56", "remaining_time": "2:05:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 271, "total_steps": 1184, "loss": 0.3101, "learning_rate": 4.0549488181240096e-05, "epoch": 0.9155405405405406, "percentage": 22.89, "elapsed_time": "0:37:01", "remaining_time": "2:04:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 272, "total_steps": 1184, "loss": 0.3087, "learning_rate": 4.057614840056998e-05, "epoch": 0.918918918918919, "percentage": 22.97, "elapsed_time": "0:37:06", "remaining_time": "2:04:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 273, "total_steps": 1184, "loss": 0.3044, "learning_rate": 4.06027107840126e-05, "epoch": 0.9222972972972973, "percentage": 23.06, "elapsed_time": "0:37:11", "remaining_time": "2:04:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 274, "total_steps": 1184, "loss": 0.2929, "learning_rate": 4.0629176047006474e-05, "epoch": 0.9256756756756757, "percentage": 23.14, "elapsed_time": "0:37:16", "remaining_time": "2:03:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 275, "total_steps": 1184, "loss": 0.321, "learning_rate": 4.065554489717105e-05, "epoch": 0.9290540540540541, "percentage": 23.23, "elapsed_time": "0:37:21", "remaining_time": "2:03:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 276, "total_steps": 1184, "loss": 0.3026, "learning_rate": 4.068181803442029e-05, "epoch": 0.9324324324324325, "percentage": 23.31, "elapsed_time": "0:37:26", "remaining_time": "2:03:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 277, "total_steps": 1184, "loss": 0.2876, "learning_rate": 4.0707996151074147e-05, "epoch": 0.9358108108108109, "percentage": 23.4, "elapsed_time": "0:37:31", "remaining_time": "2:02:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 278, "total_steps": 1184, "loss": 0.2968, "learning_rate": 4.073407993196794e-05, "epoch": 0.9391891891891891, "percentage": 23.48, "elapsed_time": "0:37:37", "remaining_time": "2:02:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 279, "total_steps": 1184, "loss": 0.3144, "learning_rate": 4.076007005455996e-05, "epoch": 0.9425675675675675, "percentage": 23.56, "elapsed_time": "0:37:42", "remaining_time": "2:02:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 1184, "loss": 0.3103, "learning_rate": 4.0785967189036986e-05, "epoch": 0.9459459459459459, "percentage": 23.65, "elapsed_time": "0:37:47", "remaining_time": "2:02:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 281, "total_steps": 1184, "loss": 0.3136, "learning_rate": 4.0811771998418e-05, "epoch": 0.9493243243243243, "percentage": 23.73, "elapsed_time": "0:37:52", "remaining_time": "2:01:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 282, "total_steps": 1184, "loss": 0.335, "learning_rate": 4.083748513865602e-05, "epoch": 0.9527027027027027, "percentage": 23.82, "elapsed_time": "0:37:57", "remaining_time": "2:01:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 283, "total_steps": 1184, "loss": 0.3036, "learning_rate": 4.086310725873818e-05, "epoch": 0.956081081081081, "percentage": 23.9, "elapsed_time": "0:38:02", "remaining_time": "2:01:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 284, "total_steps": 1184, "loss": 0.2827, "learning_rate": 4.0888639000783966e-05, "epoch": 0.9594594594594594, "percentage": 23.99, "elapsed_time": "0:38:07", "remaining_time": "2:00:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 285, "total_steps": 1184, "loss": 0.3162, "learning_rate": 4.0914081000141844e-05, "epoch": 0.9628378378378378, "percentage": 24.07, "elapsed_time": "0:38:12", "remaining_time": "2:00:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 286, "total_steps": 1184, "loss": 0.2992, "learning_rate": 4.0939433885484055e-05, "epoch": 0.9662162162162162, "percentage": 24.16, "elapsed_time": "0:38:18", "remaining_time": "2:00:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 287, "total_steps": 1184, "loss": 0.278, "learning_rate": 4.0964698278899874e-05, "epoch": 0.9695945945945946, "percentage": 24.24, "elapsed_time": "0:38:23", "remaining_time": "1:59:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 288, "total_steps": 1184, "loss": 0.3023, "learning_rate": 4.0989874795987185e-05, "epoch": 0.972972972972973, "percentage": 24.32, "elapsed_time": "0:38:28", "remaining_time": "1:59:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 289, "total_steps": 1184, "loss": 0.2806, "learning_rate": 4.1014964045942465e-05, "epoch": 0.9763513513513513, "percentage": 24.41, "elapsed_time": "0:38:33", "remaining_time": "1:59:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 290, "total_steps": 1184, "loss": 0.3078, "learning_rate": 4.103996663164927e-05, "epoch": 0.9797297297297297, "percentage": 24.49, "elapsed_time": "0:38:38", "remaining_time": "1:59:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 291, "total_steps": 1184, "loss": 0.3048, "learning_rate": 4.106488314976513e-05, "epoch": 0.9831081081081081, "percentage": 24.58, "elapsed_time": "0:38:44", "remaining_time": "1:58:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 292, "total_steps": 1184, "loss": 0.305, "learning_rate": 4.108971419080698e-05, "epoch": 0.9864864864864865, "percentage": 24.66, "elapsed_time": "0:38:49", "remaining_time": "1:58:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 293, "total_steps": 1184, "loss": 0.3027, "learning_rate": 4.111446033923516e-05, "epoch": 0.9898648648648649, "percentage": 24.75, "elapsed_time": "0:38:54", "remaining_time": "1:58:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 294, "total_steps": 1184, "loss": 0.3148, "learning_rate": 4.113912217353596e-05, "epoch": 0.9932432432432432, "percentage": 24.83, "elapsed_time": "0:38:59", "remaining_time": "1:58:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 295, "total_steps": 1184, "loss": 0.303, "learning_rate": 4.116370026630272e-05, "epoch": 0.9966216216216216, "percentage": 24.92, "elapsed_time": "0:39:04", "remaining_time": "1:57:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 296, "total_steps": 1184, "loss": 0.2768, "learning_rate": 4.118819518431564e-05, "epoch": 1.0, "percentage": 25.0, "elapsed_time": "0:39:09", "remaining_time": "1:57:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 297, "total_steps": 1184, "loss": 0.2319, "learning_rate": 4.121260748862021e-05, "epoch": 1.0033783783783783, "percentage": 25.08, "elapsed_time": "0:39:14", "remaining_time": "1:57:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 298, "total_steps": 1184, "loss": 0.2332, "learning_rate": 4.123693773460426e-05, "epoch": 1.0067567567567568, "percentage": 25.17, "elapsed_time": "0:39:20", "remaining_time": "1:56:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 299, "total_steps": 1184, "loss": 0.2113, "learning_rate": 4.126118647207383e-05, "epoch": 1.010135135135135, "percentage": 25.25, "elapsed_time": "0:39:25", "remaining_time": "1:56:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 1184, "loss": 0.2428, "learning_rate": 4.1285354245327715e-05, "epoch": 1.0135135135135136, "percentage": 25.34, "elapsed_time": "0:39:30", "remaining_time": "1:56:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 301, "total_steps": 1184, "loss": 0.2394, "learning_rate": 4.1309441593230726e-05, "epoch": 1.0168918918918919, "percentage": 25.42, "elapsed_time": "0:39:35", "remaining_time": "1:56:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 302, "total_steps": 1184, "loss": 0.2584, "learning_rate": 4.133344904928585e-05, "epoch": 1.0202702702702702, "percentage": 25.51, "elapsed_time": "0:39:40", "remaining_time": "1:55:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 303, "total_steps": 1184, "loss": 0.2191, "learning_rate": 4.1357377141705084e-05, "epoch": 1.0236486486486487, "percentage": 25.59, "elapsed_time": "0:39:45", "remaining_time": "1:55:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 304, "total_steps": 1184, "loss": 0.2185, "learning_rate": 4.1381226393479236e-05, "epoch": 1.027027027027027, "percentage": 25.68, "elapsed_time": "0:39:50", "remaining_time": "1:55:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 305, "total_steps": 1184, "loss": 0.2328, "learning_rate": 4.1404997322446435e-05, "epoch": 1.0304054054054055, "percentage": 25.76, "elapsed_time": "0:39:55", "remaining_time": "1:55:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 306, "total_steps": 1184, "loss": 0.2197, "learning_rate": 4.142869044135967e-05, "epoch": 1.0337837837837838, "percentage": 25.84, "elapsed_time": "0:40:01", "remaining_time": "1:54:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 307, "total_steps": 1184, "loss": 0.2093, "learning_rate": 4.145230625795311e-05, "epoch": 1.037162162162162, "percentage": 25.93, "elapsed_time": "0:40:06", "remaining_time": "1:54:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 308, "total_steps": 1184, "loss": 0.2145, "learning_rate": 4.14758452750074e-05, "epoch": 1.0405405405405406, "percentage": 26.01, "elapsed_time": "0:40:11", "remaining_time": "1:54:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 309, "total_steps": 1184, "loss": 0.222, "learning_rate": 4.149930799041392e-05, "epoch": 1.0439189189189189, "percentage": 26.1, "elapsed_time": "0:40:16", "remaining_time": "1:54:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 310, "total_steps": 1184, "loss": 0.2245, "learning_rate": 4.152269489723788e-05, "epoch": 1.0472972972972974, "percentage": 26.18, "elapsed_time": "0:40:21", "remaining_time": "1:53:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 311, "total_steps": 1184, "loss": 0.2428, "learning_rate": 4.1546006483780626e-05, "epoch": 1.0506756756756757, "percentage": 26.27, "elapsed_time": "0:40:26", "remaining_time": "1:53:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 312, "total_steps": 1184, "loss": 0.2311, "learning_rate": 4.156924323364072e-05, "epoch": 1.054054054054054, "percentage": 26.35, "elapsed_time": "0:40:31", "remaining_time": "1:53:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 313, "total_steps": 1184, "loss": 0.2315, "learning_rate": 4.1592405625774144e-05, "epoch": 1.0574324324324325, "percentage": 26.44, "elapsed_time": "0:40:36", "remaining_time": "1:53:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 314, "total_steps": 1184, "loss": 0.2205, "learning_rate": 4.161549413455358e-05, "epoch": 1.0608108108108107, "percentage": 26.52, "elapsed_time": "0:40:42", "remaining_time": "1:52:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 315, "total_steps": 1184, "loss": 0.1969, "learning_rate": 4.163850922982668e-05, "epoch": 1.0641891891891893, "percentage": 26.6, "elapsed_time": "0:40:47", "remaining_time": "1:52:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 316, "total_steps": 1184, "loss": 0.2183, "learning_rate": 4.16614513769734e-05, "epoch": 1.0675675675675675, "percentage": 26.69, "elapsed_time": "0:40:52", "remaining_time": "1:52:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 317, "total_steps": 1184, "loss": 0.2581, "learning_rate": 4.1684321036962526e-05, "epoch": 1.070945945945946, "percentage": 26.77, "elapsed_time": "0:40:57", "remaining_time": "1:52:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 318, "total_steps": 1184, "loss": 0.2454, "learning_rate": 4.170711866640721e-05, "epoch": 1.0743243243243243, "percentage": 26.86, "elapsed_time": "0:41:02", "remaining_time": "1:51:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 319, "total_steps": 1184, "loss": 0.2303, "learning_rate": 4.1729844717619684e-05, "epoch": 1.0777027027027026, "percentage": 26.94, "elapsed_time": "0:41:07", "remaining_time": "1:51:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 320, "total_steps": 1184, "loss": 0.2205, "learning_rate": 4.17524996386651e-05, "epoch": 1.0810810810810811, "percentage": 27.03, "elapsed_time": "0:41:12", "remaining_time": "1:51:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 321, "total_steps": 1184, "loss": 0.2538, "learning_rate": 4.177508387341454e-05, "epoch": 1.0844594594594594, "percentage": 27.11, "elapsed_time": "0:41:17", "remaining_time": "1:51:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 322, "total_steps": 1184, "loss": 0.5427, "learning_rate": 4.179759786159719e-05, "epoch": 1.087837837837838, "percentage": 27.2, "elapsed_time": "0:41:23", "remaining_time": "1:50:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 323, "total_steps": 1184, "loss": 0.2445, "learning_rate": 4.182004203885172e-05, "epoch": 1.0912162162162162, "percentage": 27.28, "elapsed_time": "0:41:28", "remaining_time": "1:50:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 324, "total_steps": 1184, "loss": 0.2577, "learning_rate": 4.184241683677687e-05, "epoch": 1.0945945945945945, "percentage": 27.36, "elapsed_time": "0:41:33", "remaining_time": "1:50:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 325, "total_steps": 1184, "loss": 0.2421, "learning_rate": 4.1864722682981245e-05, "epoch": 1.097972972972973, "percentage": 27.45, "elapsed_time": "0:41:38", "remaining_time": "1:50:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 326, "total_steps": 1184, "loss": 0.2122, "learning_rate": 4.188696000113232e-05, "epoch": 1.1013513513513513, "percentage": 27.53, "elapsed_time": "0:41:43", "remaining_time": "1:49:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 327, "total_steps": 1184, "loss": 0.2295, "learning_rate": 4.190912921100477e-05, "epoch": 1.1047297297297298, "percentage": 27.62, "elapsed_time": "0:41:48", "remaining_time": "1:49:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 328, "total_steps": 1184, "loss": 0.2352, "learning_rate": 4.1931230728527994e-05, "epoch": 1.1081081081081081, "percentage": 27.7, "elapsed_time": "0:41:53", "remaining_time": "1:49:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 329, "total_steps": 1184, "loss": 0.7099, "learning_rate": 4.195326496583291e-05, "epoch": 1.1114864864864864, "percentage": 27.79, "elapsed_time": "0:41:58", "remaining_time": "1:49:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 330, "total_steps": 1184, "loss": 0.2105, "learning_rate": 4.1975232331298125e-05, "epoch": 1.114864864864865, "percentage": 27.87, "elapsed_time": "0:42:04", "remaining_time": "1:48:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 331, "total_steps": 1184, "loss": 0.2063, "learning_rate": 4.1997133229595316e-05, "epoch": 1.1182432432432432, "percentage": 27.96, "elapsed_time": "0:42:09", "remaining_time": "1:48:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 332, "total_steps": 1184, "loss": 0.2447, "learning_rate": 4.201896806173394e-05, "epoch": 1.1216216216216217, "percentage": 28.04, "elapsed_time": "0:42:14", "remaining_time": "1:48:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 333, "total_steps": 1184, "loss": 0.2298, "learning_rate": 4.2040737225105335e-05, "epoch": 1.125, "percentage": 28.12, "elapsed_time": "0:42:19", "remaining_time": "1:48:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 334, "total_steps": 1184, "loss": 0.1799, "learning_rate": 4.206244111352608e-05, "epoch": 1.1283783783783783, "percentage": 28.21, "elapsed_time": "0:42:24", "remaining_time": "1:47:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 335, "total_steps": 1184, "loss": 0.2254, "learning_rate": 4.2084080117280756e-05, "epoch": 1.1317567567567568, "percentage": 28.29, "elapsed_time": "0:42:29", "remaining_time": "1:47:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 336, "total_steps": 1184, "loss": 0.2342, "learning_rate": 4.210565462316407e-05, "epoch": 1.135135135135135, "percentage": 28.38, "elapsed_time": "0:42:34", "remaining_time": "1:47:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 337, "total_steps": 1184, "loss": 0.2384, "learning_rate": 4.2127165014522315e-05, "epoch": 1.1385135135135136, "percentage": 28.46, "elapsed_time": "0:42:39", "remaining_time": "1:47:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 338, "total_steps": 1184, "loss": 0.2213, "learning_rate": 4.214861167129425e-05, "epoch": 1.1418918918918919, "percentage": 28.55, "elapsed_time": "0:42:45", "remaining_time": "1:47:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 339, "total_steps": 1184, "loss": 0.8302, "learning_rate": 4.2169994970051365e-05, "epoch": 1.1452702702702702, "percentage": 28.63, "elapsed_time": "0:42:50", "remaining_time": "1:46:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 340, "total_steps": 1184, "loss": 0.2568, "learning_rate": 4.219131528403759e-05, "epoch": 1.1486486486486487, "percentage": 28.72, "elapsed_time": "0:42:55", "remaining_time": "1:46:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 341, "total_steps": 1184, "loss": 0.2574, "learning_rate": 4.22125729832083e-05, "epoch": 1.152027027027027, "percentage": 28.8, "elapsed_time": "0:43:00", "remaining_time": "1:46:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 342, "total_steps": 1184, "loss": 0.8118, "learning_rate": 4.2233768434268914e-05, "epoch": 1.1554054054054055, "percentage": 28.89, "elapsed_time": "0:43:05", "remaining_time": "1:46:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 343, "total_steps": 1184, "loss": 0.2347, "learning_rate": 4.225490200071284e-05, "epoch": 1.1587837837837838, "percentage": 28.97, "elapsed_time": "0:43:10", "remaining_time": "1:45:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 344, "total_steps": 1184, "loss": 0.2453, "learning_rate": 4.227597404285883e-05, "epoch": 1.1621621621621623, "percentage": 29.05, "elapsed_time": "0:43:15", "remaining_time": "1:45:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 345, "total_steps": 1184, "loss": 0.2313, "learning_rate": 4.229698491788791e-05, "epoch": 1.1655405405405406, "percentage": 29.14, "elapsed_time": "0:43:20", "remaining_time": "1:45:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 346, "total_steps": 1184, "loss": 0.256, "learning_rate": 4.231793497987961e-05, "epoch": 1.1689189189189189, "percentage": 29.22, "elapsed_time": "0:43:25", "remaining_time": "1:45:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 347, "total_steps": 1184, "loss": 0.2655, "learning_rate": 4.2338824579847904e-05, "epoch": 1.1722972972972974, "percentage": 29.31, "elapsed_time": "0:43:31", "remaining_time": "1:44:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 348, "total_steps": 1184, "loss": 0.2385, "learning_rate": 4.235965406577636e-05, "epoch": 1.1756756756756757, "percentage": 29.39, "elapsed_time": "0:43:36", "remaining_time": "1:44:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 349, "total_steps": 1184, "loss": 0.2196, "learning_rate": 4.2380423782653e-05, "epoch": 1.179054054054054, "percentage": 29.48, "elapsed_time": "0:43:41", "remaining_time": "1:44:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 1184, "loss": 0.2337, "learning_rate": 4.240113407250459e-05, "epoch": 1.1824324324324325, "percentage": 29.56, "elapsed_time": "0:43:46", "remaining_time": "1:44:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 351, "total_steps": 1184, "loss": 0.2438, "learning_rate": 4.24217852744304e-05, "epoch": 1.1858108108108107, "percentage": 29.65, "elapsed_time": "0:43:51", "remaining_time": "1:44:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 352, "total_steps": 1184, "loss": 0.2458, "learning_rate": 4.244237772463552e-05, "epoch": 1.1891891891891893, "percentage": 29.73, "elapsed_time": "0:43:56", "remaining_time": "1:43:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 353, "total_steps": 1184, "loss": 0.2391, "learning_rate": 4.246291175646371e-05, "epoch": 1.1925675675675675, "percentage": 29.81, "elapsed_time": "0:44:01", "remaining_time": "1:43:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 354, "total_steps": 1184, "loss": 0.2299, "learning_rate": 4.24833877004298e-05, "epoch": 1.195945945945946, "percentage": 29.9, "elapsed_time": "0:44:06", "remaining_time": "1:43:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 355, "total_steps": 1184, "loss": 0.2272, "learning_rate": 4.250380588425157e-05, "epoch": 1.1993243243243243, "percentage": 29.98, "elapsed_time": "0:44:12", "remaining_time": "1:43:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 356, "total_steps": 1184, "loss": 0.2737, "learning_rate": 4.2524166632881255e-05, "epoch": 1.2027027027027026, "percentage": 30.07, "elapsed_time": "0:44:17", "remaining_time": "1:43:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 357, "total_steps": 1184, "loss": 0.2648, "learning_rate": 4.254447026853656e-05, "epoch": 1.2060810810810811, "percentage": 30.15, "elapsed_time": "0:44:22", "remaining_time": "1:42:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 358, "total_steps": 1184, "loss": 0.2643, "learning_rate": 4.2564717110731244e-05, "epoch": 1.2094594594594594, "percentage": 30.24, "elapsed_time": "0:44:27", "remaining_time": "1:42:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 359, "total_steps": 1184, "loss": 0.6041, "learning_rate": 4.258490747630532e-05, "epoch": 1.2128378378378377, "percentage": 30.32, "elapsed_time": "0:44:32", "remaining_time": "1:42:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 360, "total_steps": 1184, "loss": 0.2226, "learning_rate": 4.260504167945479e-05, "epoch": 1.2162162162162162, "percentage": 30.41, "elapsed_time": "0:44:37", "remaining_time": "1:42:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 361, "total_steps": 1184, "loss": 0.2205, "learning_rate": 4.2625120031760965e-05, "epoch": 1.2195945945945945, "percentage": 30.49, "elapsed_time": "0:44:42", "remaining_time": "1:41:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 362, "total_steps": 1184, "loss": 0.2272, "learning_rate": 4.264514284221944e-05, "epoch": 1.222972972972973, "percentage": 30.57, "elapsed_time": "0:44:48", "remaining_time": "1:41:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 363, "total_steps": 1184, "loss": 0.2536, "learning_rate": 4.266511041726854e-05, "epoch": 1.2263513513513513, "percentage": 30.66, "elapsed_time": "0:44:53", "remaining_time": "1:41:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 364, "total_steps": 1184, "loss": 0.2582, "learning_rate": 4.26850230608176e-05, "epoch": 1.2297297297297298, "percentage": 30.74, "elapsed_time": "0:44:58", "remaining_time": "1:41:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 365, "total_steps": 1184, "loss": 0.2288, "learning_rate": 4.2704881074274584e-05, "epoch": 1.2331081081081081, "percentage": 30.83, "elapsed_time": "0:45:03", "remaining_time": "1:41:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 366, "total_steps": 1184, "loss": 0.2396, "learning_rate": 4.272468475657351e-05, "epoch": 1.2364864864864864, "percentage": 30.91, "elapsed_time": "0:45:08", "remaining_time": "1:40:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 367, "total_steps": 1184, "loss": 1.9213, "learning_rate": 4.2744434404201497e-05, "epoch": 1.239864864864865, "percentage": 31.0, "elapsed_time": "0:45:13", "remaining_time": "1:40:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 368, "total_steps": 1184, "loss": 0.2528, "learning_rate": 4.27641303112253e-05, "epoch": 1.2432432432432432, "percentage": 31.08, "elapsed_time": "0:45:18", "remaining_time": "1:40:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 369, "total_steps": 1184, "loss": 0.2235, "learning_rate": 4.278377276931767e-05, "epoch": 1.2466216216216217, "percentage": 31.17, "elapsed_time": "0:45:24", "remaining_time": "1:40:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 370, "total_steps": 1184, "loss": 0.2111, "learning_rate": 4.2803362067783256e-05, "epoch": 1.25, "percentage": 31.25, "elapsed_time": "0:45:29", "remaining_time": "1:40:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 371, "total_steps": 1184, "loss": 0.2256, "learning_rate": 4.2822898493584104e-05, "epoch": 1.2533783783783785, "percentage": 31.33, "elapsed_time": "0:45:34", "remaining_time": "1:39:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 372, "total_steps": 1184, "loss": 0.2295, "learning_rate": 4.284238233136496e-05, "epoch": 1.2567567567567568, "percentage": 31.42, "elapsed_time": "0:45:39", "remaining_time": "1:39:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 373, "total_steps": 1184, "loss": 0.2394, "learning_rate": 4.286181386347813e-05, "epoch": 1.260135135135135, "percentage": 31.5, "elapsed_time": "0:45:44", "remaining_time": "1:39:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 374, "total_steps": 1184, "loss": 0.2108, "learning_rate": 4.288119337000801e-05, "epoch": 1.2635135135135136, "percentage": 31.59, "elapsed_time": "0:45:49", "remaining_time": "1:39:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 375, "total_steps": 1184, "loss": 0.2192, "learning_rate": 4.2900521128795315e-05, "epoch": 1.2668918918918919, "percentage": 31.67, "elapsed_time": "0:45:54", "remaining_time": "1:39:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 376, "total_steps": 1184, "loss": 0.2403, "learning_rate": 4.291979741546102e-05, "epoch": 1.2702702702702702, "percentage": 31.76, "elapsed_time": "0:45:59", "remaining_time": "1:38:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 377, "total_steps": 1184, "loss": 0.2086, "learning_rate": 4.293902250342989e-05, "epoch": 1.2736486486486487, "percentage": 31.84, "elapsed_time": "0:46:05", "remaining_time": "1:38:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 378, "total_steps": 1184, "loss": 0.236, "learning_rate": 4.295819666395376e-05, "epoch": 1.277027027027027, "percentage": 31.93, "elapsed_time": "0:46:10", "remaining_time": "1:38:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 379, "total_steps": 1184, "loss": 0.2271, "learning_rate": 4.297732016613454e-05, "epoch": 1.2804054054054055, "percentage": 32.01, "elapsed_time": "0:46:15", "remaining_time": "1:38:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 380, "total_steps": 1184, "loss": 0.2356, "learning_rate": 4.299639327694684e-05, "epoch": 1.2837837837837838, "percentage": 32.09, "elapsed_time": "0:46:20", "remaining_time": "1:38:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 381, "total_steps": 1184, "loss": 0.2247, "learning_rate": 4.3015416261260325e-05, "epoch": 1.2871621621621623, "percentage": 32.18, "elapsed_time": "0:46:25", "remaining_time": "1:37:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 382, "total_steps": 1184, "loss": 0.2477, "learning_rate": 4.303438938186182e-05, "epoch": 1.2905405405405406, "percentage": 32.26, "elapsed_time": "0:46:30", "remaining_time": "1:37:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 383, "total_steps": 1184, "loss": 0.221, "learning_rate": 4.305331289947705e-05, "epoch": 1.2939189189189189, "percentage": 32.35, "elapsed_time": "0:46:35", "remaining_time": "1:37:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 384, "total_steps": 1184, "loss": 0.2443, "learning_rate": 4.3072187072792184e-05, "epoch": 1.2972972972972974, "percentage": 32.43, "elapsed_time": "0:46:40", "remaining_time": "1:37:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 385, "total_steps": 1184, "loss": 0.2043, "learning_rate": 4.309101215847502e-05, "epoch": 1.3006756756756757, "percentage": 32.52, "elapsed_time": "0:46:46", "remaining_time": "1:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 386, "total_steps": 1184, "loss": 0.246, "learning_rate": 4.3109788411195924e-05, "epoch": 1.304054054054054, "percentage": 32.6, "elapsed_time": "0:46:51", "remaining_time": "1:36:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 387, "total_steps": 1184, "loss": 0.2305, "learning_rate": 4.312851608364853e-05, "epoch": 1.3074324324324325, "percentage": 32.69, "elapsed_time": "0:46:56", "remaining_time": "1:36:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 388, "total_steps": 1184, "loss": 0.2146, "learning_rate": 4.314719542657013e-05, "epoch": 1.3108108108108107, "percentage": 32.77, "elapsed_time": "0:47:01", "remaining_time": "1:36:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 389, "total_steps": 1184, "loss": 1.1445, "learning_rate": 4.3165826688761796e-05, "epoch": 1.3141891891891893, "percentage": 32.85, "elapsed_time": "0:47:06", "remaining_time": "1:36:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 390, "total_steps": 1184, "loss": 0.2591, "learning_rate": 4.318441011710833e-05, "epoch": 1.3175675675675675, "percentage": 32.94, "elapsed_time": "0:47:11", "remaining_time": "1:36:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 391, "total_steps": 1184, "loss": 0.2409, "learning_rate": 4.3202945956597786e-05, "epoch": 1.320945945945946, "percentage": 33.02, "elapsed_time": "0:47:16", "remaining_time": "1:35:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 392, "total_steps": 1184, "loss": 1.022, "learning_rate": 4.3221434450340956e-05, "epoch": 1.3243243243243243, "percentage": 33.11, "elapsed_time": "0:47:21", "remaining_time": "1:35:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 393, "total_steps": 1184, "loss": 0.2287, "learning_rate": 4.323987583959045e-05, "epoch": 1.3277027027027026, "percentage": 33.19, "elapsed_time": "0:47:26", "remaining_time": "1:35:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 394, "total_steps": 1184, "loss": 0.2148, "learning_rate": 4.325827036375957e-05, "epoch": 1.3310810810810811, "percentage": 33.28, "elapsed_time": "0:47:32", "remaining_time": "1:35:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 395, "total_steps": 1184, "loss": 0.6968, "learning_rate": 4.327661826044101e-05, "epoch": 1.3344594594594594, "percentage": 33.36, "elapsed_time": "0:47:37", "remaining_time": "1:35:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 396, "total_steps": 1184, "loss": 0.6915, "learning_rate": 4.329491976542521e-05, "epoch": 1.3378378378378377, "percentage": 33.45, "elapsed_time": "0:47:42", "remaining_time": "1:34:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 397, "total_steps": 1184, "loss": 0.2388, "learning_rate": 4.331317511271859e-05, "epoch": 1.3412162162162162, "percentage": 33.53, "elapsed_time": "0:47:47", "remaining_time": "1:34:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 398, "total_steps": 1184, "loss": 0.2655, "learning_rate": 4.333138453456147e-05, "epoch": 1.3445945945945945, "percentage": 33.61, "elapsed_time": "0:47:52", "remaining_time": "1:34:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 399, "total_steps": 1184, "loss": 0.6129, "learning_rate": 4.334954826144581e-05, "epoch": 1.347972972972973, "percentage": 33.7, "elapsed_time": "0:47:57", "remaining_time": "1:34:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 400, "total_steps": 1184, "loss": 0.2492, "learning_rate": 4.336766652213271e-05, "epoch": 1.3513513513513513, "percentage": 33.78, "elapsed_time": "0:48:02", "remaining_time": "1:34:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 401, "total_steps": 1184, "loss": 0.2578, "learning_rate": 4.338573954366971e-05, "epoch": 1.3547297297297298, "percentage": 33.87, "elapsed_time": "0:48:07", "remaining_time": "1:33:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 402, "total_steps": 1184, "loss": 0.6334, "learning_rate": 4.340376755140784e-05, "epoch": 1.3581081081081081, "percentage": 33.95, "elapsed_time": "0:48:13", "remaining_time": "1:33:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 403, "total_steps": 1184, "loss": 0.2426, "learning_rate": 4.342175076901849e-05, "epoch": 1.3614864864864864, "percentage": 34.04, "elapsed_time": "0:48:18", "remaining_time": "1:33:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 404, "total_steps": 1184, "loss": 0.2715, "learning_rate": 4.343968941851009e-05, "epoch": 1.364864864864865, "percentage": 34.12, "elapsed_time": "0:48:23", "remaining_time": "1:33:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 405, "total_steps": 1184, "loss": 0.2462, "learning_rate": 4.345758372024448e-05, "epoch": 1.3682432432432432, "percentage": 34.21, "elapsed_time": "0:48:28", "remaining_time": "1:33:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 406, "total_steps": 1184, "loss": 0.5967, "learning_rate": 4.347543389295324e-05, "epoch": 1.3716216216216215, "percentage": 34.29, "elapsed_time": "0:48:33", "remaining_time": "1:33:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 407, "total_steps": 1184, "loss": 0.226, "learning_rate": 4.3493240153753666e-05, "epoch": 1.375, "percentage": 34.38, "elapsed_time": "0:48:38", "remaining_time": "1:32:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 408, "total_steps": 1184, "loss": 0.2266, "learning_rate": 4.3511002718164666e-05, "epoch": 1.3783783783783785, "percentage": 34.46, "elapsed_time": "0:48:43", "remaining_time": "1:32:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 409, "total_steps": 1184, "loss": 0.2028, "learning_rate": 4.352872180012237e-05, "epoch": 1.3817567567567568, "percentage": 34.54, "elapsed_time": "0:48:48", "remaining_time": "1:32:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 410, "total_steps": 1184, "loss": 0.2291, "learning_rate": 4.35463976119956e-05, "epoch": 1.385135135135135, "percentage": 34.63, "elapsed_time": "0:48:54", "remaining_time": "1:32:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 411, "total_steps": 1184, "loss": 0.2124, "learning_rate": 4.356403036460115e-05, "epoch": 1.3885135135135136, "percentage": 34.71, "elapsed_time": "0:48:59", "remaining_time": "1:32:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 412, "total_steps": 1184, "loss": 0.2013, "learning_rate": 4.3581620267218916e-05, "epoch": 1.3918918918918919, "percentage": 34.8, "elapsed_time": "0:49:04", "remaining_time": "1:31:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 413, "total_steps": 1184, "loss": 0.2439, "learning_rate": 4.359916752760669e-05, "epoch": 1.3952702702702702, "percentage": 34.88, "elapsed_time": "0:49:09", "remaining_time": "1:31:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 414, "total_steps": 1184, "loss": 0.2321, "learning_rate": 4.361667235201499e-05, "epoch": 1.3986486486486487, "percentage": 34.97, "elapsed_time": "0:49:14", "remaining_time": "1:31:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 415, "total_steps": 1184, "loss": 0.2418, "learning_rate": 4.363413494520154e-05, "epoch": 1.402027027027027, "percentage": 35.05, "elapsed_time": "0:49:19", "remaining_time": "1:31:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 416, "total_steps": 1184, "loss": 0.213, "learning_rate": 4.365155551044572e-05, "epoch": 1.4054054054054055, "percentage": 35.14, "elapsed_time": "0:49:25", "remaining_time": "1:31:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 417, "total_steps": 1184, "loss": 0.5716, "learning_rate": 4.366893424956263e-05, "epoch": 1.4087837837837838, "percentage": 35.22, "elapsed_time": "0:49:30", "remaining_time": "1:31:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 418, "total_steps": 1184, "loss": 0.2404, "learning_rate": 4.368627136291726e-05, "epoch": 1.4121621621621623, "percentage": 35.3, "elapsed_time": "0:49:35", "remaining_time": "1:30:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 419, "total_steps": 1184, "loss": 0.2349, "learning_rate": 4.370356704943825e-05, "epoch": 1.4155405405405406, "percentage": 35.39, "elapsed_time": "0:49:40", "remaining_time": "1:30:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 420, "total_steps": 1184, "loss": 0.2365, "learning_rate": 4.372082150663168e-05, "epoch": 1.4189189189189189, "percentage": 35.47, "elapsed_time": "0:49:45", "remaining_time": "1:30:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 421, "total_steps": 1184, "loss": 0.2256, "learning_rate": 4.3738034930594475e-05, "epoch": 1.4222972972972974, "percentage": 35.56, "elapsed_time": "0:49:51", "remaining_time": "1:30:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 422, "total_steps": 1184, "loss": 0.2283, "learning_rate": 4.3755207516027904e-05, "epoch": 1.4256756756756757, "percentage": 35.64, "elapsed_time": "0:49:56", "remaining_time": "1:30:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 423, "total_steps": 1184, "loss": 0.2374, "learning_rate": 4.377233945625071e-05, "epoch": 1.429054054054054, "percentage": 35.73, "elapsed_time": "0:50:02", "remaining_time": "1:30:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 424, "total_steps": 1184, "loss": 0.4887, "learning_rate": 4.378943094321221e-05, "epoch": 1.4324324324324325, "percentage": 35.81, "elapsed_time": "0:50:07", "remaining_time": "1:29:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 425, "total_steps": 1184, "loss": 0.2373, "learning_rate": 4.3806482167505196e-05, "epoch": 1.4358108108108107, "percentage": 35.9, "elapsed_time": "0:50:14", "remaining_time": "1:29:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 426, "total_steps": 1184, "loss": 0.5312, "learning_rate": 4.382349331837866e-05, "epoch": 1.4391891891891893, "percentage": 35.98, "elapsed_time": "0:50:20", "remaining_time": "1:29:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 427, "total_steps": 1184, "loss": 0.2347, "learning_rate": 4.3840464583750404e-05, "epoch": 1.4425675675675675, "percentage": 36.06, "elapsed_time": "0:50:25", "remaining_time": "1:29:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 428, "total_steps": 1184, "loss": 0.2392, "learning_rate": 4.385739615021954e-05, "epoch": 1.445945945945946, "percentage": 36.15, "elapsed_time": "0:50:30", "remaining_time": "1:29:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 429, "total_steps": 1184, "loss": 0.2346, "learning_rate": 4.387428820307874e-05, "epoch": 1.4493243243243243, "percentage": 36.23, "elapsed_time": "0:50:36", "remaining_time": "1:29:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 430, "total_steps": 1184, "loss": 0.2242, "learning_rate": 4.3891140926326446e-05, "epoch": 1.4527027027027026, "percentage": 36.32, "elapsed_time": "0:50:41", "remaining_time": "1:28:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 431, "total_steps": 1184, "loss": 0.2267, "learning_rate": 4.390795450267886e-05, "epoch": 1.4560810810810811, "percentage": 36.4, "elapsed_time": "0:50:46", "remaining_time": "1:28:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 432, "total_steps": 1184, "loss": 0.237, "learning_rate": 4.3924729113581876e-05, "epoch": 1.4594594594594594, "percentage": 36.49, "elapsed_time": "0:50:51", "remaining_time": "1:28:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 433, "total_steps": 1184, "loss": 0.2624, "learning_rate": 4.394146493922276e-05, "epoch": 1.4628378378378377, "percentage": 36.57, "elapsed_time": "0:50:56", "remaining_time": "1:28:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 434, "total_steps": 1184, "loss": 0.2076, "learning_rate": 4.395816215854185e-05, "epoch": 1.4662162162162162, "percentage": 36.66, "elapsed_time": "0:51:01", "remaining_time": "1:28:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 435, "total_steps": 1184, "loss": 0.224, "learning_rate": 4.397482094924396e-05, "epoch": 1.4695945945945945, "percentage": 36.74, "elapsed_time": "0:51:06", "remaining_time": "1:28:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 436, "total_steps": 1184, "loss": 0.5361, "learning_rate": 4.399144148780977e-05, "epoch": 1.472972972972973, "percentage": 36.82, "elapsed_time": "0:51:11", "remaining_time": "1:27:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 437, "total_steps": 1184, "loss": 0.2274, "learning_rate": 4.400802394950703e-05, "epoch": 1.4763513513513513, "percentage": 36.91, "elapsed_time": "0:51:17", "remaining_time": "1:27:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 438, "total_steps": 1184, "loss": 0.2295, "learning_rate": 4.402456850840166e-05, "epoch": 1.4797297297297298, "percentage": 36.99, "elapsed_time": "0:51:22", "remaining_time": "1:27:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 439, "total_steps": 1184, "loss": 0.2447, "learning_rate": 4.4041075337368695e-05, "epoch": 1.4831081081081081, "percentage": 37.08, "elapsed_time": "0:51:27", "remaining_time": "1:27:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 440, "total_steps": 1184, "loss": 0.2522, "learning_rate": 4.405754460810312e-05, "epoch": 1.4864864864864864, "percentage": 37.16, "elapsed_time": "0:51:32", "remaining_time": "1:27:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 441, "total_steps": 1184, "loss": 0.8104, "learning_rate": 4.407397649113065e-05, "epoch": 1.489864864864865, "percentage": 37.25, "elapsed_time": "0:51:37", "remaining_time": "1:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 442, "total_steps": 1184, "loss": 0.2657, "learning_rate": 4.40903711558182e-05, "epoch": 1.4932432432432432, "percentage": 37.33, "elapsed_time": "0:51:42", "remaining_time": "1:26:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 443, "total_steps": 1184, "loss": 0.246, "learning_rate": 4.41067287703845e-05, "epoch": 1.4966216216216215, "percentage": 37.42, "elapsed_time": "0:51:47", "remaining_time": "1:26:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 444, "total_steps": 1184, "loss": 0.219, "learning_rate": 4.412304950191033e-05, "epoch": 1.5, "percentage": 37.5, "elapsed_time": "0:51:52", "remaining_time": "1:26:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 445, "total_steps": 1184, "loss": 0.2293, "learning_rate": 4.413933351634886e-05, "epoch": 1.5033783783783785, "percentage": 37.58, "elapsed_time": "0:51:57", "remaining_time": "1:26:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 446, "total_steps": 1184, "loss": 0.218, "learning_rate": 4.4155580978535707e-05, "epoch": 1.5067567567567568, "percentage": 37.67, "elapsed_time": "0:52:03", "remaining_time": "1:26:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 447, "total_steps": 1184, "loss": 0.2278, "learning_rate": 4.417179205219895e-05, "epoch": 1.510135135135135, "percentage": 37.75, "elapsed_time": "0:52:08", "remaining_time": "1:25:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 448, "total_steps": 1184, "loss": 0.2276, "learning_rate": 4.418796689996907e-05, "epoch": 1.5135135135135136, "percentage": 37.84, "elapsed_time": "0:52:13", "remaining_time": "1:25:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 449, "total_steps": 1184, "loss": 0.23, "learning_rate": 4.420410568338872e-05, "epoch": 1.5168918918918919, "percentage": 37.92, "elapsed_time": "0:52:18", "remaining_time": "1:25:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 450, "total_steps": 1184, "loss": 0.2445, "learning_rate": 4.42202085629224e-05, "epoch": 1.5202702702702702, "percentage": 38.01, "elapsed_time": "0:52:23", "remaining_time": "1:25:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 451, "total_steps": 1184, "loss": 0.2405, "learning_rate": 4.423627569796601e-05, "epoch": 1.5236486486486487, "percentage": 38.09, "elapsed_time": "0:52:28", "remaining_time": "1:25:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 452, "total_steps": 1184, "loss": 0.2299, "learning_rate": 4.425230724685638e-05, "epoch": 1.527027027027027, "percentage": 38.18, "elapsed_time": "0:52:33", "remaining_time": "1:25:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 453, "total_steps": 1184, "loss": 0.234, "learning_rate": 4.4268303366880536e-05, "epoch": 1.5304054054054053, "percentage": 38.26, "elapsed_time": "0:52:38", "remaining_time": "1:24:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 454, "total_steps": 1184, "loss": 0.2165, "learning_rate": 4.428426421428507e-05, "epoch": 1.5337837837837838, "percentage": 38.34, "elapsed_time": "0:52:44", "remaining_time": "1:24:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 455, "total_steps": 1184, "loss": 0.2648, "learning_rate": 4.430018994428521e-05, "epoch": 1.5371621621621623, "percentage": 38.43, "elapsed_time": "0:52:49", "remaining_time": "1:24:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 456, "total_steps": 1184, "loss": 0.2526, "learning_rate": 4.431608071107392e-05, "epoch": 1.5405405405405406, "percentage": 38.51, "elapsed_time": "0:52:54", "remaining_time": "1:24:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 457, "total_steps": 1184, "loss": 0.2428, "learning_rate": 4.433193666783084e-05, "epoch": 1.5439189189189189, "percentage": 38.6, "elapsed_time": "0:52:59", "remaining_time": "1:24:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 458, "total_steps": 1184, "loss": 0.2437, "learning_rate": 4.4347757966731156e-05, "epoch": 1.5472972972972974, "percentage": 38.68, "elapsed_time": "0:53:04", "remaining_time": "1:24:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 459, "total_steps": 1184, "loss": 0.233, "learning_rate": 4.436354475895436e-05, "epoch": 1.5506756756756757, "percentage": 38.77, "elapsed_time": "0:53:09", "remaining_time": "1:23:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 460, "total_steps": 1184, "loss": 0.2441, "learning_rate": 4.437929719469291e-05, "epoch": 1.554054054054054, "percentage": 38.85, "elapsed_time": "0:53:14", "remaining_time": "1:23:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 461, "total_steps": 1184, "loss": 0.2233, "learning_rate": 4.4395015423160807e-05, "epoch": 1.5574324324324325, "percentage": 38.94, "elapsed_time": "0:53:19", "remaining_time": "1:23:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 462, "total_steps": 1184, "loss": 0.225, "learning_rate": 4.4410699592602094e-05, "epoch": 1.560810810810811, "percentage": 39.02, "elapsed_time": "0:53:25", "remaining_time": "1:23:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 463, "total_steps": 1184, "loss": 0.4926, "learning_rate": 4.442634985029922e-05, "epoch": 1.564189189189189, "percentage": 39.1, "elapsed_time": "0:53:30", "remaining_time": "1:23:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 464, "total_steps": 1184, "loss": 0.2333, "learning_rate": 4.444196634258136e-05, "epoch": 1.5675675675675675, "percentage": 39.19, "elapsed_time": "0:53:35", "remaining_time": "1:23:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 465, "total_steps": 1184, "loss": 0.2457, "learning_rate": 4.4457549214832566e-05, "epoch": 1.570945945945946, "percentage": 39.27, "elapsed_time": "0:53:41", "remaining_time": "1:23:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 466, "total_steps": 1184, "loss": 0.2457, "learning_rate": 4.44730986115e-05, "epoch": 1.5743243243243243, "percentage": 39.36, "elapsed_time": "0:53:46", "remaining_time": "1:22:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 467, "total_steps": 1184, "loss": 0.2335, "learning_rate": 4.448861467610187e-05, "epoch": 1.5777027027027026, "percentage": 39.44, "elapsed_time": "0:53:51", "remaining_time": "1:22:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 468, "total_steps": 1184, "loss": 0.237, "learning_rate": 4.4504097551235406e-05, "epoch": 1.5810810810810811, "percentage": 39.53, "elapsed_time": "0:53:57", "remaining_time": "1:22:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 469, "total_steps": 1184, "loss": 0.24, "learning_rate": 4.4519547378584725e-05, "epoch": 1.5844594594594594, "percentage": 39.61, "elapsed_time": "0:54:02", "remaining_time": "1:22:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 470, "total_steps": 1184, "loss": 0.2252, "learning_rate": 4.453496429892863e-05, "epoch": 1.5878378378378377, "percentage": 39.7, "elapsed_time": "0:54:07", "remaining_time": "1:22:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 471, "total_steps": 1184, "loss": 0.2099, "learning_rate": 4.455034845214827e-05, "epoch": 1.5912162162162162, "percentage": 39.78, "elapsed_time": "0:54:12", "remaining_time": "1:22:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 472, "total_steps": 1184, "loss": 0.2135, "learning_rate": 4.4565699977234796e-05, "epoch": 1.5945945945945947, "percentage": 39.86, "elapsed_time": "0:54:17", "remaining_time": "1:21:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 473, "total_steps": 1184, "loss": 0.2346, "learning_rate": 4.458101901229686e-05, "epoch": 1.597972972972973, "percentage": 39.95, "elapsed_time": "0:54:22", "remaining_time": "1:21:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 474, "total_steps": 1184, "loss": 0.2198, "learning_rate": 4.459630569456809e-05, "epoch": 1.6013513513513513, "percentage": 40.03, "elapsed_time": "0:54:27", "remaining_time": "1:21:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 475, "total_steps": 1184, "loss": 0.2989, "learning_rate": 4.461156016041444e-05, "epoch": 1.6047297297297298, "percentage": 40.12, "elapsed_time": "0:54:32", "remaining_time": "1:21:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 476, "total_steps": 1184, "loss": 0.5155, "learning_rate": 4.462678254534156e-05, "epoch": 1.6081081081081081, "percentage": 40.2, "elapsed_time": "0:54:37", "remaining_time": "1:21:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 477, "total_steps": 1184, "loss": 0.2645, "learning_rate": 4.464197298400191e-05, "epoch": 1.6114864864864864, "percentage": 40.29, "elapsed_time": "0:54:43", "remaining_time": "1:21:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 478, "total_steps": 1184, "loss": 0.5192, "learning_rate": 4.4657131610201994e-05, "epoch": 1.614864864864865, "percentage": 40.37, "elapsed_time": "0:54:48", "remaining_time": "1:20:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 479, "total_steps": 1184, "loss": 0.2187, "learning_rate": 4.467225855690939e-05, "epoch": 1.6182432432432432, "percentage": 40.46, "elapsed_time": "0:54:53", "remaining_time": "1:20:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 480, "total_steps": 1184, "loss": 0.2214, "learning_rate": 4.468735395625979e-05, "epoch": 1.6216216216216215, "percentage": 40.54, "elapsed_time": "0:54:58", "remaining_time": "1:20:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 481, "total_steps": 1184, "loss": 0.2414, "learning_rate": 4.470241793956387e-05, "epoch": 1.625, "percentage": 40.62, "elapsed_time": "0:55:03", "remaining_time": "1:20:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 482, "total_steps": 1184, "loss": 0.2386, "learning_rate": 4.471745063731416e-05, "epoch": 1.6283783783783785, "percentage": 40.71, "elapsed_time": "0:55:08", "remaining_time": "1:20:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 483, "total_steps": 1184, "loss": 0.1981, "learning_rate": 4.473245217919187e-05, "epoch": 1.6317567567567568, "percentage": 40.79, "elapsed_time": "0:55:13", "remaining_time": "1:20:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 484, "total_steps": 1184, "loss": 0.2212, "learning_rate": 4.474742269407355e-05, "epoch": 1.635135135135135, "percentage": 40.88, "elapsed_time": "0:55:19", "remaining_time": "1:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 485, "total_steps": 1184, "loss": 0.2753, "learning_rate": 4.476236231003773e-05, "epoch": 1.6385135135135136, "percentage": 40.96, "elapsed_time": "0:55:24", "remaining_time": "1:19:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 486, "total_steps": 1184, "loss": 0.2571, "learning_rate": 4.477727115437156e-05, "epoch": 1.6418918918918919, "percentage": 41.05, "elapsed_time": "0:55:29", "remaining_time": "1:19:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 487, "total_steps": 1184, "loss": 0.2341, "learning_rate": 4.479214935357724e-05, "epoch": 1.6452702702702702, "percentage": 41.13, "elapsed_time": "0:55:34", "remaining_time": "1:19:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 488, "total_steps": 1184, "loss": 0.2533, "learning_rate": 4.480699703337852e-05, "epoch": 1.6486486486486487, "percentage": 41.22, "elapsed_time": "0:55:39", "remaining_time": "1:19:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 489, "total_steps": 1184, "loss": 0.2394, "learning_rate": 4.4821814318727016e-05, "epoch": 1.652027027027027, "percentage": 41.3, "elapsed_time": "0:55:44", "remaining_time": "1:19:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 490, "total_steps": 1184, "loss": 0.2005, "learning_rate": 4.483660133380856e-05, "epoch": 1.6554054054054053, "percentage": 41.39, "elapsed_time": "0:55:49", "remaining_time": "1:19:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 491, "total_steps": 1184, "loss": 0.231, "learning_rate": 4.485135820204948e-05, "epoch": 1.6587837837837838, "percentage": 41.47, "elapsed_time": "0:55:54", "remaining_time": "1:18:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 492, "total_steps": 1184, "loss": 0.2529, "learning_rate": 4.486608504612267e-05, "epoch": 1.6621621621621623, "percentage": 41.55, "elapsed_time": "0:56:00", "remaining_time": "1:18:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 493, "total_steps": 1184, "loss": 0.2485, "learning_rate": 4.488078198795383e-05, "epoch": 1.6655405405405406, "percentage": 41.64, "elapsed_time": "0:56:05", "remaining_time": "1:18:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 494, "total_steps": 1184, "loss": 0.2375, "learning_rate": 4.489544914872745e-05, "epoch": 1.6689189189189189, "percentage": 41.72, "elapsed_time": "0:56:10", "remaining_time": "1:18:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 495, "total_steps": 1184, "loss": 0.2461, "learning_rate": 4.4910086648892815e-05, "epoch": 1.6722972972972974, "percentage": 41.81, "elapsed_time": "0:56:15", "remaining_time": "1:18:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 496, "total_steps": 1184, "loss": 0.2301, "learning_rate": 4.4924694608169965e-05, "epoch": 1.6756756756756757, "percentage": 41.89, "elapsed_time": "0:56:20", "remaining_time": "1:18:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 497, "total_steps": 1184, "loss": 0.235, "learning_rate": 4.4939273145555536e-05, "epoch": 1.679054054054054, "percentage": 41.98, "elapsed_time": "0:56:25", "remaining_time": "1:18:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 498, "total_steps": 1184, "loss": 0.23, "learning_rate": 4.495382237932863e-05, "epoch": 1.6824324324324325, "percentage": 42.06, "elapsed_time": "0:56:30", "remaining_time": "1:17:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 499, "total_steps": 1184, "loss": 0.2374, "learning_rate": 4.4968342427056505e-05, "epoch": 1.685810810810811, "percentage": 42.15, "elapsed_time": "0:56:36", "remaining_time": "1:17:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 1184, "loss": 0.3647, "learning_rate": 4.498283340560031e-05, "epoch": 1.689189189189189, "percentage": 42.23, "elapsed_time": "0:56:41", "remaining_time": "1:17:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 501, "total_steps": 1184, "loss": 0.2686, "learning_rate": 4.499729543112076e-05, "epoch": 1.6925675675675675, "percentage": 42.31, "elapsed_time": "1:10:15", "remaining_time": "1:35:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 502, "total_steps": 1184, "loss": 0.2521, "learning_rate": 4.501172861908366e-05, "epoch": 1.695945945945946, "percentage": 42.4, "elapsed_time": "1:10:20", "remaining_time": "1:35:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 503, "total_steps": 1184, "loss": 0.2447, "learning_rate": 4.502613308426546e-05, "epoch": 1.6993243243243243, "percentage": 42.48, "elapsed_time": "1:10:25", "remaining_time": "1:35:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 504, "total_steps": 1184, "loss": 0.2379, "learning_rate": 4.504050894075876e-05, "epoch": 1.7027027027027026, "percentage": 42.57, "elapsed_time": "1:10:30", "remaining_time": "1:35:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 505, "total_steps": 1184, "loss": 0.2399, "learning_rate": 4.5054856301977696e-05, "epoch": 1.7060810810810811, "percentage": 42.65, "elapsed_time": "1:10:35", "remaining_time": "1:34:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 506, "total_steps": 1184, "loss": 0.229, "learning_rate": 4.506917528066332e-05, "epoch": 1.7094594594594594, "percentage": 42.74, "elapsed_time": "1:10:40", "remaining_time": "1:34:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 507, "total_steps": 1184, "loss": 0.2237, "learning_rate": 4.508346598888894e-05, "epoch": 1.7128378378378377, "percentage": 42.82, "elapsed_time": "1:10:45", "remaining_time": "1:34:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 508, "total_steps": 1184, "loss": 0.2175, "learning_rate": 4.509772853806532e-05, "epoch": 1.7162162162162162, "percentage": 42.91, "elapsed_time": "1:10:50", "remaining_time": "1:34:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 509, "total_steps": 1184, "loss": 0.2444, "learning_rate": 4.511196303894598e-05, "epoch": 1.7195945945945947, "percentage": 42.99, "elapsed_time": "1:10:55", "remaining_time": "1:34:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 510, "total_steps": 1184, "loss": 0.2357, "learning_rate": 4.512616960163227e-05, "epoch": 1.722972972972973, "percentage": 43.07, "elapsed_time": "1:11:00", "remaining_time": "1:33:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 511, "total_steps": 1184, "loss": 0.2375, "learning_rate": 4.5140348335578547e-05, "epoch": 1.7263513513513513, "percentage": 43.16, "elapsed_time": "1:11:06", "remaining_time": "1:33:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 512, "total_steps": 1184, "loss": 0.2444, "learning_rate": 4.515449934959718e-05, "epoch": 1.7297297297297298, "percentage": 43.24, "elapsed_time": "1:11:11", "remaining_time": "1:33:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 513, "total_steps": 1184, "loss": 0.2324, "learning_rate": 4.516862275186361e-05, "epoch": 1.7331081081081081, "percentage": 43.33, "elapsed_time": "1:11:16", "remaining_time": "1:33:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 514, "total_steps": 1184, "loss": 0.2359, "learning_rate": 4.518271864992127e-05, "epoch": 1.7364864864864864, "percentage": 43.41, "elapsed_time": "1:11:21", "remaining_time": "1:33:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 515, "total_steps": 1184, "loss": 0.2708, "learning_rate": 4.519678715068652e-05, "epoch": 1.739864864864865, "percentage": 43.5, "elapsed_time": "1:11:26", "remaining_time": "1:32:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 516, "total_steps": 1184, "loss": 0.2452, "learning_rate": 4.521082836045353e-05, "epoch": 1.7432432432432432, "percentage": 43.58, "elapsed_time": "1:11:31", "remaining_time": "1:32:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 517, "total_steps": 1184, "loss": 0.2344, "learning_rate": 4.5224842384899045e-05, "epoch": 1.7466216216216215, "percentage": 43.67, "elapsed_time": "1:11:36", "remaining_time": "1:32:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 518, "total_steps": 1184, "loss": 0.2511, "learning_rate": 4.523882932908722e-05, "epoch": 1.75, "percentage": 43.75, "elapsed_time": "1:11:41", "remaining_time": "1:32:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 519, "total_steps": 1184, "loss": 0.2162, "learning_rate": 4.52527892974743e-05, "epoch": 1.7533783783783785, "percentage": 43.83, "elapsed_time": "1:11:46", "remaining_time": "1:31:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 520, "total_steps": 1184, "loss": 0.2281, "learning_rate": 4.526672239391333e-05, "epoch": 1.7567567567567568, "percentage": 43.92, "elapsed_time": "1:11:52", "remaining_time": "1:31:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 521, "total_steps": 1184, "loss": 0.2257, "learning_rate": 4.528062872165875e-05, "epoch": 1.760135135135135, "percentage": 44.0, "elapsed_time": "1:11:57", "remaining_time": "1:31:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 522, "total_steps": 1184, "loss": 0.2304, "learning_rate": 4.529450838337104e-05, "epoch": 1.7635135135135136, "percentage": 44.09, "elapsed_time": "1:12:02", "remaining_time": "1:31:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 523, "total_steps": 1184, "loss": 0.2341, "learning_rate": 4.530836148112124e-05, "epoch": 1.7668918918918919, "percentage": 44.17, "elapsed_time": "1:12:07", "remaining_time": "1:31:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 524, "total_steps": 1184, "loss": 0.272, "learning_rate": 4.532218811639545e-05, "epoch": 1.7702702702702702, "percentage": 44.26, "elapsed_time": "1:12:12", "remaining_time": "1:30:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 525, "total_steps": 1184, "loss": 0.2195, "learning_rate": 4.5335988390099284e-05, "epoch": 1.7736486486486487, "percentage": 44.34, "elapsed_time": "1:12:17", "remaining_time": "1:30:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 526, "total_steps": 1184, "loss": 0.2335, "learning_rate": 4.534976240256232e-05, "epoch": 1.777027027027027, "percentage": 44.43, "elapsed_time": "1:12:22", "remaining_time": "1:30:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 527, "total_steps": 1184, "loss": 0.4532, "learning_rate": 4.536351025354245e-05, "epoch": 1.7804054054054053, "percentage": 44.51, "elapsed_time": "1:12:27", "remaining_time": "1:30:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 528, "total_steps": 1184, "loss": 0.2541, "learning_rate": 4.537723204223021e-05, "epoch": 1.7837837837837838, "percentage": 44.59, "elapsed_time": "1:12:32", "remaining_time": "1:30:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 529, "total_steps": 1184, "loss": 0.2287, "learning_rate": 4.53909278672531e-05, "epoch": 1.7871621621621623, "percentage": 44.68, "elapsed_time": "1:12:38", "remaining_time": "1:29:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 530, "total_steps": 1184, "loss": 0.2196, "learning_rate": 4.5404597826679824e-05, "epoch": 1.7905405405405406, "percentage": 44.76, "elapsed_time": "1:12:43", "remaining_time": "1:29:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 531, "total_steps": 1184, "loss": 0.2393, "learning_rate": 4.541824201802449e-05, "epoch": 1.7939189189189189, "percentage": 44.85, "elapsed_time": "1:12:48", "remaining_time": "1:29:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 532, "total_steps": 1184, "loss": 0.2469, "learning_rate": 4.543186053825081e-05, "epoch": 1.7972972972972974, "percentage": 44.93, "elapsed_time": "1:12:53", "remaining_time": "1:29:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 533, "total_steps": 1184, "loss": 0.2652, "learning_rate": 4.544545348377621e-05, "epoch": 1.8006756756756757, "percentage": 45.02, "elapsed_time": "1:12:58", "remaining_time": "1:29:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 534, "total_steps": 1184, "loss": 0.2386, "learning_rate": 4.5459020950475946e-05, "epoch": 1.804054054054054, "percentage": 45.1, "elapsed_time": "1:13:03", "remaining_time": "1:28:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 535, "total_steps": 1184, "loss": 0.5287, "learning_rate": 4.5472563033687145e-05, "epoch": 1.8074324324324325, "percentage": 45.19, "elapsed_time": "1:13:08", "remaining_time": "1:28:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 536, "total_steps": 1184, "loss": 0.2102, "learning_rate": 4.548607982821284e-05, "epoch": 1.810810810810811, "percentage": 45.27, "elapsed_time": "1:13:13", "remaining_time": "1:28:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 537, "total_steps": 1184, "loss": 0.2058, "learning_rate": 4.5499571428325935e-05, "epoch": 1.814189189189189, "percentage": 45.35, "elapsed_time": "1:13:18", "remaining_time": "1:28:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 538, "total_steps": 1184, "loss": 0.2349, "learning_rate": 4.5513037927773155e-05, "epoch": 1.8175675675675675, "percentage": 45.44, "elapsed_time": "1:13:24", "remaining_time": "1:28:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 539, "total_steps": 1184, "loss": 0.2519, "learning_rate": 4.5526479419778986e-05, "epoch": 1.820945945945946, "percentage": 45.52, "elapsed_time": "1:13:29", "remaining_time": "1:27:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 540, "total_steps": 1184, "loss": 0.2518, "learning_rate": 4.553989599704948e-05, "epoch": 1.8243243243243243, "percentage": 45.61, "elapsed_time": "1:13:34", "remaining_time": "1:27:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 541, "total_steps": 1184, "loss": 0.2341, "learning_rate": 4.555328775177616e-05, "epoch": 1.8277027027027026, "percentage": 45.69, "elapsed_time": "1:13:39", "remaining_time": "1:27:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 542, "total_steps": 1184, "loss": 0.2553, "learning_rate": 4.5566654775639785e-05, "epoch": 1.8310810810810811, "percentage": 45.78, "elapsed_time": "1:13:44", "remaining_time": "1:27:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 543, "total_steps": 1184, "loss": 0.2447, "learning_rate": 4.5579997159814117e-05, "epoch": 1.8344594594594594, "percentage": 45.86, "elapsed_time": "1:13:49", "remaining_time": "1:27:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 544, "total_steps": 1184, "loss": 0.2307, "learning_rate": 4.5593314994969665e-05, "epoch": 1.8378378378378377, "percentage": 45.95, "elapsed_time": "1:13:54", "remaining_time": "1:26:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 545, "total_steps": 1184, "loss": 0.1971, "learning_rate": 4.560660837127738e-05, "epoch": 1.8412162162162162, "percentage": 46.03, "elapsed_time": "1:14:00", "remaining_time": "1:26:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 546, "total_steps": 1184, "loss": 0.2552, "learning_rate": 4.561987737841229e-05, "epoch": 1.8445945945945947, "percentage": 46.11, "elapsed_time": "1:14:05", "remaining_time": "1:26:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 547, "total_steps": 1184, "loss": 0.2373, "learning_rate": 4.563312210555719e-05, "epoch": 1.847972972972973, "percentage": 46.2, "elapsed_time": "1:14:11", "remaining_time": "1:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 548, "total_steps": 1184, "loss": 0.2304, "learning_rate": 4.564634264140616e-05, "epoch": 1.8513513513513513, "percentage": 46.28, "elapsed_time": "1:14:16", "remaining_time": "1:26:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 549, "total_steps": 1184, "loss": 0.2263, "learning_rate": 4.56595390741682e-05, "epoch": 1.8547297297297298, "percentage": 46.37, "elapsed_time": "1:14:21", "remaining_time": "1:26:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 550, "total_steps": 1184, "loss": 0.218, "learning_rate": 4.567271149157073e-05, "epoch": 1.8581081081081081, "percentage": 46.45, "elapsed_time": "1:14:26", "remaining_time": "1:25:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 551, "total_steps": 1184, "loss": 0.2497, "learning_rate": 4.5685859980863086e-05, "epoch": 1.8614864864864864, "percentage": 46.54, "elapsed_time": "1:14:31", "remaining_time": "1:25:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 552, "total_steps": 1184, "loss": 0.2514, "learning_rate": 4.569898462881999e-05, "epoch": 1.864864864864865, "percentage": 46.62, "elapsed_time": "1:14:36", "remaining_time": "1:25:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 553, "total_steps": 1184, "loss": 0.2744, "learning_rate": 4.571208552174497e-05, "epoch": 1.8682432432432432, "percentage": 46.71, "elapsed_time": "1:14:41", "remaining_time": "1:25:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 554, "total_steps": 1184, "loss": 0.2712, "learning_rate": 4.572516274547383e-05, "epoch": 1.8716216216216215, "percentage": 46.79, "elapsed_time": "1:14:46", "remaining_time": "1:25:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 555, "total_steps": 1184, "loss": 0.2319, "learning_rate": 4.573821638537794e-05, "epoch": 1.875, "percentage": 46.88, "elapsed_time": "1:14:52", "remaining_time": "1:24:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 556, "total_steps": 1184, "loss": 0.2302, "learning_rate": 4.575124652636763e-05, "epoch": 1.8783783783783785, "percentage": 46.96, "elapsed_time": "1:14:57", "remaining_time": "1:24:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 557, "total_steps": 1184, "loss": 0.2413, "learning_rate": 4.5764253252895486e-05, "epoch": 1.8817567567567568, "percentage": 47.04, "elapsed_time": "1:15:02", "remaining_time": "1:24:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 558, "total_steps": 1184, "loss": 0.2477, "learning_rate": 4.577723664895965e-05, "epoch": 1.885135135135135, "percentage": 47.13, "elapsed_time": "1:15:07", "remaining_time": "1:24:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 559, "total_steps": 1184, "loss": 0.2525, "learning_rate": 4.579019679810706e-05, "epoch": 1.8885135135135136, "percentage": 47.21, "elapsed_time": "1:15:12", "remaining_time": "1:24:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 560, "total_steps": 1184, "loss": 0.2226, "learning_rate": 4.5803133783436676e-05, "epoch": 1.8918918918918919, "percentage": 47.3, "elapsed_time": "1:15:17", "remaining_time": "1:23:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 561, "total_steps": 1184, "loss": 0.2434, "learning_rate": 4.581604768760269e-05, "epoch": 1.8952702702702702, "percentage": 47.38, "elapsed_time": "1:15:23", "remaining_time": "1:23:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 562, "total_steps": 1184, "loss": 0.2287, "learning_rate": 4.582893859281769e-05, "epoch": 1.8986486486486487, "percentage": 47.47, "elapsed_time": "1:15:28", "remaining_time": "1:23:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 563, "total_steps": 1184, "loss": 0.2285, "learning_rate": 4.584180658085578e-05, "epoch": 1.902027027027027, "percentage": 47.55, "elapsed_time": "1:15:33", "remaining_time": "1:23:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 564, "total_steps": 1184, "loss": 0.2174, "learning_rate": 4.585465173305571e-05, "epoch": 1.9054054054054053, "percentage": 47.64, "elapsed_time": "1:15:38", "remaining_time": "1:23:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 565, "total_steps": 1184, "loss": 0.2482, "learning_rate": 4.5867474130323984e-05, "epoch": 1.9087837837837838, "percentage": 47.72, "elapsed_time": "1:15:43", "remaining_time": "1:22:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 566, "total_steps": 1184, "loss": 0.1858, "learning_rate": 4.588027385313786e-05, "epoch": 1.9121621621621623, "percentage": 47.8, "elapsed_time": "1:15:48", "remaining_time": "1:22:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 567, "total_steps": 1184, "loss": 0.2847, "learning_rate": 4.5893050981548446e-05, "epoch": 1.9155405405405406, "percentage": 47.89, "elapsed_time": "1:15:53", "remaining_time": "1:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 568, "total_steps": 1184, "loss": 0.2265, "learning_rate": 4.5905805595183656e-05, "epoch": 1.9189189189189189, "percentage": 47.97, "elapsed_time": "1:15:58", "remaining_time": "1:22:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 569, "total_steps": 1184, "loss": 0.258, "learning_rate": 4.591853777325119e-05, "epoch": 1.9222972972972974, "percentage": 48.06, "elapsed_time": "1:16:04", "remaining_time": "1:22:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 570, "total_steps": 1184, "loss": 0.2398, "learning_rate": 4.593124759454153e-05, "epoch": 1.9256756756756757, "percentage": 48.14, "elapsed_time": "1:16:09", "remaining_time": "1:22:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 571, "total_steps": 1184, "loss": 0.2292, "learning_rate": 4.5943935137430806e-05, "epoch": 1.929054054054054, "percentage": 48.23, "elapsed_time": "1:16:14", "remaining_time": "1:21:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 572, "total_steps": 1184, "loss": 0.2313, "learning_rate": 4.595660047988374e-05, "epoch": 1.9324324324324325, "percentage": 48.31, "elapsed_time": "1:16:19", "remaining_time": "1:21:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 573, "total_steps": 1184, "loss": 0.2501, "learning_rate": 4.59692436994565e-05, "epoch": 1.935810810810811, "percentage": 48.4, "elapsed_time": "1:16:24", "remaining_time": "1:21:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 574, "total_steps": 1184, "loss": 0.2099, "learning_rate": 4.5981864873299563e-05, "epoch": 1.939189189189189, "percentage": 48.48, "elapsed_time": "1:16:29", "remaining_time": "1:21:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 575, "total_steps": 1184, "loss": 0.2272, "learning_rate": 4.599446407816052e-05, "epoch": 1.9425675675675675, "percentage": 48.56, "elapsed_time": "1:16:34", "remaining_time": "1:21:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 576, "total_steps": 1184, "loss": 0.2352, "learning_rate": 4.6007041390386874e-05, "epoch": 1.945945945945946, "percentage": 48.65, "elapsed_time": "1:16:39", "remaining_time": "1:20:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 577, "total_steps": 1184, "loss": 0.2207, "learning_rate": 4.601959688592886e-05, "epoch": 1.9493243243243243, "percentage": 48.73, "elapsed_time": "1:16:44", "remaining_time": "1:20:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 578, "total_steps": 1184, "loss": 0.2437, "learning_rate": 4.603213064034216e-05, "epoch": 1.9527027027027026, "percentage": 48.82, "elapsed_time": "1:16:50", "remaining_time": "1:20:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 579, "total_steps": 1184, "loss": 0.2436, "learning_rate": 4.604464272879061e-05, "epoch": 1.9560810810810811, "percentage": 48.9, "elapsed_time": "1:16:55", "remaining_time": "1:20:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 580, "total_steps": 1184, "loss": 0.2065, "learning_rate": 4.605713322604896e-05, "epoch": 1.9594594594594594, "percentage": 48.99, "elapsed_time": "1:17:00", "remaining_time": "1:20:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 581, "total_steps": 1184, "loss": 0.2435, "learning_rate": 4.606960220650551e-05, "epoch": 1.9628378378378377, "percentage": 49.07, "elapsed_time": "1:17:05", "remaining_time": "1:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 582, "total_steps": 1184, "loss": 0.2456, "learning_rate": 4.608204974416481e-05, "epoch": 1.9662162162162162, "percentage": 49.16, "elapsed_time": "1:17:10", "remaining_time": "1:19:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 583, "total_steps": 1184, "loss": 0.2214, "learning_rate": 4.6094475912650234e-05, "epoch": 1.9695945945945947, "percentage": 49.24, "elapsed_time": "1:17:15", "remaining_time": "1:19:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 584, "total_steps": 1184, "loss": 0.2148, "learning_rate": 4.610688078520666e-05, "epoch": 1.972972972972973, "percentage": 49.32, "elapsed_time": "1:17:20", "remaining_time": "1:19:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 585, "total_steps": 1184, "loss": 0.2219, "learning_rate": 4.611926443470301e-05, "epoch": 1.9763513513513513, "percentage": 49.41, "elapsed_time": "1:17:25", "remaining_time": "1:19:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 586, "total_steps": 1184, "loss": 0.2153, "learning_rate": 4.6131626933634844e-05, "epoch": 1.9797297297297298, "percentage": 49.49, "elapsed_time": "1:17:31", "remaining_time": "1:19:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 587, "total_steps": 1184, "loss": 0.2459, "learning_rate": 4.6143968354126914e-05, "epoch": 1.9831081081081081, "percentage": 49.58, "elapsed_time": "1:17:36", "remaining_time": "1:18:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 588, "total_steps": 1184, "loss": 0.2339, "learning_rate": 4.6156288767935646e-05, "epoch": 1.9864864864864864, "percentage": 49.66, "elapsed_time": "1:17:41", "remaining_time": "1:18:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 589, "total_steps": 1184, "loss": 0.2109, "learning_rate": 4.61685882464517e-05, "epoch": 1.989864864864865, "percentage": 49.75, "elapsed_time": "1:17:46", "remaining_time": "1:18:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 590, "total_steps": 1184, "loss": 0.2232, "learning_rate": 4.61808668607024e-05, "epoch": 1.9932432432432432, "percentage": 49.83, "elapsed_time": "1:17:51", "remaining_time": "1:18:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 591, "total_steps": 1184, "loss": 0.2286, "learning_rate": 4.619312468135426e-05, "epoch": 1.9966216216216215, "percentage": 49.92, "elapsed_time": "1:17:56", "remaining_time": "1:18:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 592, "total_steps": 1184, "loss": 0.1979, "learning_rate": 4.620536177871533e-05, "epoch": 2.0, "percentage": 50.0, "elapsed_time": "1:18:01", "remaining_time": "1:18:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 593, "total_steps": 1184, "loss": 0.1664, "learning_rate": 4.621757822273772e-05, "epoch": 2.0033783783783785, "percentage": 50.08, "elapsed_time": "1:18:06", "remaining_time": "1:17:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 594, "total_steps": 1184, "loss": 0.1489, "learning_rate": 4.62297740830199e-05, "epoch": 2.0067567567567566, "percentage": 50.17, "elapsed_time": "1:18:12", "remaining_time": "1:17:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 595, "total_steps": 1184, "loss": 0.1666, "learning_rate": 4.6241949428809165e-05, "epoch": 2.010135135135135, "percentage": 50.25, "elapsed_time": "1:18:17", "remaining_time": "1:17:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 596, "total_steps": 1184, "loss": 0.1667, "learning_rate": 4.625410432900395e-05, "epoch": 2.0135135135135136, "percentage": 50.34, "elapsed_time": "1:18:22", "remaining_time": "1:17:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 597, "total_steps": 1184, "loss": 0.1611, "learning_rate": 4.626623885215616e-05, "epoch": 2.016891891891892, "percentage": 50.42, "elapsed_time": "1:18:27", "remaining_time": "1:17:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 598, "total_steps": 1184, "loss": 0.183, "learning_rate": 4.627835306647352e-05, "epoch": 2.02027027027027, "percentage": 50.51, "elapsed_time": "1:18:32", "remaining_time": "1:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 599, "total_steps": 1184, "loss": 0.1592, "learning_rate": 4.629044703982186e-05, "epoch": 2.0236486486486487, "percentage": 50.59, "elapsed_time": "1:18:37", "remaining_time": "1:16:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 600, "total_steps": 1184, "loss": 0.1459, "learning_rate": 4.63025208397274e-05, "epoch": 2.027027027027027, "percentage": 50.68, "elapsed_time": "1:18:42", "remaining_time": "1:16:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 601, "total_steps": 1184, "loss": 0.1632, "learning_rate": 4.6314574533379e-05, "epoch": 2.0304054054054053, "percentage": 50.76, "elapsed_time": "1:18:47", "remaining_time": "1:16:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 602, "total_steps": 1184, "loss": 0.1699, "learning_rate": 4.632660818763041e-05, "epoch": 2.0337837837837838, "percentage": 50.84, "elapsed_time": "1:18:52", "remaining_time": "1:16:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 603, "total_steps": 1184, "loss": 0.1725, "learning_rate": 4.633862186900253e-05, "epoch": 2.0371621621621623, "percentage": 50.93, "elapsed_time": "1:18:58", "remaining_time": "1:16:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 604, "total_steps": 1184, "loss": 0.172, "learning_rate": 4.6350615643685535e-05, "epoch": 2.0405405405405403, "percentage": 51.01, "elapsed_time": "1:19:03", "remaining_time": "1:15:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 605, "total_steps": 1184, "loss": 0.1591, "learning_rate": 4.6362589577541154e-05, "epoch": 2.043918918918919, "percentage": 51.1, "elapsed_time": "1:19:08", "remaining_time": "1:15:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 606, "total_steps": 1184, "loss": 0.1486, "learning_rate": 4.637454373610477e-05, "epoch": 2.0472972972972974, "percentage": 51.18, "elapsed_time": "1:19:13", "remaining_time": "1:15:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 607, "total_steps": 1184, "loss": 0.1521, "learning_rate": 4.638647818458763e-05, "epoch": 2.050675675675676, "percentage": 51.27, "elapsed_time": "1:19:18", "remaining_time": "1:15:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 608, "total_steps": 1184, "loss": 0.1441, "learning_rate": 4.639839298787892e-05, "epoch": 2.054054054054054, "percentage": 51.35, "elapsed_time": "1:19:23", "remaining_time": "1:15:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 609, "total_steps": 1184, "loss": 0.165, "learning_rate": 4.641028821054793e-05, "epoch": 2.0574324324324325, "percentage": 51.44, "elapsed_time": "1:19:28", "remaining_time": "1:15:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 610, "total_steps": 1184, "loss": 0.1464, "learning_rate": 4.6422163916846124e-05, "epoch": 2.060810810810811, "percentage": 51.52, "elapsed_time": "1:19:33", "remaining_time": "1:14:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 611, "total_steps": 1184, "loss": 0.1604, "learning_rate": 4.643402017070924e-05, "epoch": 2.064189189189189, "percentage": 51.6, "elapsed_time": "1:19:39", "remaining_time": "1:14:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 612, "total_steps": 1184, "loss": 0.1739, "learning_rate": 4.644585703575936e-05, "epoch": 2.0675675675675675, "percentage": 51.69, "elapsed_time": "1:19:44", "remaining_time": "1:14:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 613, "total_steps": 1184, "loss": 0.1592, "learning_rate": 4.645767457530692e-05, "epoch": 2.070945945945946, "percentage": 51.77, "elapsed_time": "1:19:49", "remaining_time": "1:14:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 614, "total_steps": 1184, "loss": 0.1591, "learning_rate": 4.64694728523528e-05, "epoch": 2.074324324324324, "percentage": 51.86, "elapsed_time": "1:19:54", "remaining_time": "1:14:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 615, "total_steps": 1184, "loss": 0.1745, "learning_rate": 4.648125192959028e-05, "epoch": 2.0777027027027026, "percentage": 51.94, "elapsed_time": "1:20:00", "remaining_time": "1:14:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 616, "total_steps": 1184, "loss": 0.1541, "learning_rate": 4.649301186940709e-05, "epoch": 2.081081081081081, "percentage": 52.03, "elapsed_time": "1:20:05", "remaining_time": "1:13:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 617, "total_steps": 1184, "loss": 0.1851, "learning_rate": 4.650475273388737e-05, "epoch": 2.0844594594594597, "percentage": 52.11, "elapsed_time": "1:20:10", "remaining_time": "1:13:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 618, "total_steps": 1184, "loss": 0.1502, "learning_rate": 4.651647458481359e-05, "epoch": 2.0878378378378377, "percentage": 52.2, "elapsed_time": "1:20:15", "remaining_time": "1:13:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 619, "total_steps": 1184, "loss": 0.1533, "learning_rate": 4.652817748366864e-05, "epoch": 2.0912162162162162, "percentage": 52.28, "elapsed_time": "1:20:20", "remaining_time": "1:13:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 620, "total_steps": 1184, "loss": 0.1704, "learning_rate": 4.653986149163757e-05, "epoch": 2.0945945945945947, "percentage": 52.36, "elapsed_time": "1:20:25", "remaining_time": "1:13:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 621, "total_steps": 1184, "loss": 0.1338, "learning_rate": 4.655152666960967e-05, "epoch": 2.097972972972973, "percentage": 52.45, "elapsed_time": "1:20:30", "remaining_time": "1:12:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 622, "total_steps": 1184, "loss": 0.1573, "learning_rate": 4.6563173078180315e-05, "epoch": 2.1013513513513513, "percentage": 52.53, "elapsed_time": "1:20:35", "remaining_time": "1:12:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 623, "total_steps": 1184, "loss": 0.1672, "learning_rate": 4.657480077765283e-05, "epoch": 2.10472972972973, "percentage": 52.62, "elapsed_time": "1:20:41", "remaining_time": "1:12:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 624, "total_steps": 1184, "loss": 0.1851, "learning_rate": 4.6586409828040405e-05, "epoch": 2.108108108108108, "percentage": 52.7, "elapsed_time": "1:20:46", "remaining_time": "1:12:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 625, "total_steps": 1184, "loss": 0.1451, "learning_rate": 4.659800028906792e-05, "epoch": 2.1114864864864864, "percentage": 52.79, "elapsed_time": "1:20:51", "remaining_time": "1:12:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 626, "total_steps": 1184, "loss": 0.1656, "learning_rate": 4.660957222017383e-05, "epoch": 2.114864864864865, "percentage": 52.87, "elapsed_time": "1:20:56", "remaining_time": "1:12:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 627, "total_steps": 1184, "loss": 0.1672, "learning_rate": 4.662112568051194e-05, "epoch": 2.1182432432432434, "percentage": 52.96, "elapsed_time": "1:21:01", "remaining_time": "1:11:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 628, "total_steps": 1184, "loss": 0.1761, "learning_rate": 4.663266072895327e-05, "epoch": 2.1216216216216215, "percentage": 53.04, "elapsed_time": "1:21:06", "remaining_time": "1:11:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 629, "total_steps": 1184, "loss": 0.1679, "learning_rate": 4.664417742408782e-05, "epoch": 2.125, "percentage": 53.12, "elapsed_time": "1:21:12", "remaining_time": "1:11:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 630, "total_steps": 1184, "loss": 0.1763, "learning_rate": 4.665567582422637e-05, "epoch": 2.1283783783783785, "percentage": 53.21, "elapsed_time": "1:21:17", "remaining_time": "1:11:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 631, "total_steps": 1184, "loss": 0.1535, "learning_rate": 4.666715598740224e-05, "epoch": 2.1317567567567566, "percentage": 53.29, "elapsed_time": "1:21:22", "remaining_time": "1:11:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 632, "total_steps": 1184, "loss": 0.1456, "learning_rate": 4.667861797137309e-05, "epoch": 2.135135135135135, "percentage": 53.38, "elapsed_time": "1:21:27", "remaining_time": "1:11:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 633, "total_steps": 1184, "loss": 0.1478, "learning_rate": 4.669006183362258e-05, "epoch": 2.1385135135135136, "percentage": 53.46, "elapsed_time": "1:21:32", "remaining_time": "1:10:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 634, "total_steps": 1184, "loss": 0.157, "learning_rate": 4.670148763136221e-05, "epoch": 2.141891891891892, "percentage": 53.55, "elapsed_time": "1:21:37", "remaining_time": "1:10:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 635, "total_steps": 1184, "loss": 0.1552, "learning_rate": 4.671289542153293e-05, "epoch": 2.14527027027027, "percentage": 53.63, "elapsed_time": "1:21:42", "remaining_time": "1:10:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 636, "total_steps": 1184, "loss": 0.1848, "learning_rate": 4.672428526080691e-05, "epoch": 2.1486486486486487, "percentage": 53.72, "elapsed_time": "1:21:47", "remaining_time": "1:10:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 637, "total_steps": 1184, "loss": 0.1803, "learning_rate": 4.673565720558918e-05, "epoch": 2.152027027027027, "percentage": 53.8, "elapsed_time": "1:21:53", "remaining_time": "1:10:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 638, "total_steps": 1184, "loss": 0.177, "learning_rate": 4.6747011312019374e-05, "epoch": 2.1554054054054053, "percentage": 53.89, "elapsed_time": "1:21:58", "remaining_time": "1:10:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 639, "total_steps": 1184, "loss": 0.164, "learning_rate": 4.6758347635973334e-05, "epoch": 2.1587837837837838, "percentage": 53.97, "elapsed_time": "1:22:03", "remaining_time": "1:09:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 640, "total_steps": 1184, "loss": 0.164, "learning_rate": 4.676966623306479e-05, "epoch": 2.1621621621621623, "percentage": 54.05, "elapsed_time": "1:22:08", "remaining_time": "1:09:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 641, "total_steps": 1184, "loss": 0.1642, "learning_rate": 4.678096715864696e-05, "epoch": 2.1655405405405403, "percentage": 54.14, "elapsed_time": "1:22:13", "remaining_time": "1:09:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 642, "total_steps": 1184, "loss": 0.155, "learning_rate": 4.679225046781422e-05, "epoch": 2.168918918918919, "percentage": 54.22, "elapsed_time": "1:22:18", "remaining_time": "1:09:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 643, "total_steps": 1184, "loss": 0.171, "learning_rate": 4.68035162154037e-05, "epoch": 2.1722972972972974, "percentage": 54.31, "elapsed_time": "1:22:23", "remaining_time": "1:09:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 644, "total_steps": 1184, "loss": 0.1692, "learning_rate": 4.681476445599687e-05, "epoch": 2.175675675675676, "percentage": 54.39, "elapsed_time": "1:22:28", "remaining_time": "1:09:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 645, "total_steps": 1184, "loss": 0.162, "learning_rate": 4.6825995243921137e-05, "epoch": 2.179054054054054, "percentage": 54.48, "elapsed_time": "1:22:33", "remaining_time": "1:08:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 646, "total_steps": 1184, "loss": 0.184, "learning_rate": 4.683720863325141e-05, "epoch": 2.1824324324324325, "percentage": 54.56, "elapsed_time": "1:22:39", "remaining_time": "1:08:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 647, "total_steps": 1184, "loss": 0.175, "learning_rate": 4.684840467781168e-05, "epoch": 2.185810810810811, "percentage": 54.65, "elapsed_time": "1:22:44", "remaining_time": "1:08:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 648, "total_steps": 1184, "loss": 0.1577, "learning_rate": 4.685958343117656e-05, "epoch": 2.189189189189189, "percentage": 54.73, "elapsed_time": "1:22:49", "remaining_time": "1:08:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 649, "total_steps": 1184, "loss": 0.1521, "learning_rate": 4.6870744946672826e-05, "epoch": 2.1925675675675675, "percentage": 54.81, "elapsed_time": "1:22:54", "remaining_time": "1:08:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 650, "total_steps": 1184, "loss": 0.1685, "learning_rate": 4.688188927738093e-05, "epoch": 2.195945945945946, "percentage": 54.9, "elapsed_time": "1:22:59", "remaining_time": "1:08:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 651, "total_steps": 1184, "loss": 0.1837, "learning_rate": 4.689301647613653e-05, "epoch": 2.199324324324324, "percentage": 54.98, "elapsed_time": "1:23:04", "remaining_time": "1:08:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 652, "total_steps": 1184, "loss": 0.174, "learning_rate": 4.6904126595532014e-05, "epoch": 2.2027027027027026, "percentage": 55.07, "elapsed_time": "1:23:09", "remaining_time": "1:07:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 653, "total_steps": 1184, "loss": 0.1741, "learning_rate": 4.69152196879179e-05, "epoch": 2.206081081081081, "percentage": 55.15, "elapsed_time": "1:23:15", "remaining_time": "1:07:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 654, "total_steps": 1184, "loss": 0.1559, "learning_rate": 4.692629580540446e-05, "epoch": 2.2094594594594597, "percentage": 55.24, "elapsed_time": "1:23:20", "remaining_time": "1:07:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 655, "total_steps": 1184, "loss": 0.1618, "learning_rate": 4.693735499986305e-05, "epoch": 2.2128378378378377, "percentage": 55.32, "elapsed_time": "1:23:25", "remaining_time": "1:07:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 656, "total_steps": 1184, "loss": 0.1478, "learning_rate": 4.694839732292767e-05, "epoch": 2.2162162162162162, "percentage": 55.41, "elapsed_time": "1:23:30", "remaining_time": "1:07:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 657, "total_steps": 1184, "loss": 0.1738, "learning_rate": 4.6959422825996345e-05, "epoch": 2.2195945945945947, "percentage": 55.49, "elapsed_time": "1:23:35", "remaining_time": "1:07:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 658, "total_steps": 1184, "loss": 0.1665, "learning_rate": 4.69704315602326e-05, "epoch": 2.222972972972973, "percentage": 55.57, "elapsed_time": "1:23:40", "remaining_time": "1:06:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 659, "total_steps": 1184, "loss": 0.1771, "learning_rate": 4.698142357656684e-05, "epoch": 2.2263513513513513, "percentage": 55.66, "elapsed_time": "1:23:45", "remaining_time": "1:06:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 660, "total_steps": 1184, "loss": 0.1591, "learning_rate": 4.6992398925697814e-05, "epoch": 2.22972972972973, "percentage": 55.74, "elapsed_time": "1:23:50", "remaining_time": "1:06:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 661, "total_steps": 1184, "loss": 0.2062, "learning_rate": 4.7003357658094e-05, "epoch": 2.233108108108108, "percentage": 55.83, "elapsed_time": "1:23:55", "remaining_time": "1:06:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 662, "total_steps": 1184, "loss": 0.1502, "learning_rate": 4.7014299823995005e-05, "epoch": 2.2364864864864864, "percentage": 55.91, "elapsed_time": "1:24:01", "remaining_time": "1:06:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 663, "total_steps": 1184, "loss": 0.1636, "learning_rate": 4.702522547341289e-05, "epoch": 2.239864864864865, "percentage": 56.0, "elapsed_time": "1:24:06", "remaining_time": "1:06:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 664, "total_steps": 1184, "loss": 0.1625, "learning_rate": 4.703613465613363e-05, "epoch": 2.2432432432432434, "percentage": 56.08, "elapsed_time": "1:24:11", "remaining_time": "1:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 665, "total_steps": 1184, "loss": 0.1833, "learning_rate": 4.704702742171841e-05, "epoch": 2.2466216216216215, "percentage": 56.17, "elapsed_time": "1:24:16", "remaining_time": "1:05:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 666, "total_steps": 1184, "loss": 0.1707, "learning_rate": 4.7057903819505024e-05, "epoch": 2.25, "percentage": 56.25, "elapsed_time": "1:24:21", "remaining_time": "1:05:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 667, "total_steps": 1184, "loss": 0.1508, "learning_rate": 4.7068763898609154e-05, "epoch": 2.2533783783783785, "percentage": 56.33, "elapsed_time": "1:24:27", "remaining_time": "1:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 668, "total_steps": 1184, "loss": 0.1786, "learning_rate": 4.707960770792576e-05, "epoch": 2.2567567567567566, "percentage": 56.42, "elapsed_time": "1:24:32", "remaining_time": "1:05:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 669, "total_steps": 1184, "loss": 0.1797, "learning_rate": 4.709043529613039e-05, "epoch": 2.260135135135135, "percentage": 56.5, "elapsed_time": "1:24:38", "remaining_time": "1:05:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 670, "total_steps": 1184, "loss": 0.1874, "learning_rate": 4.710124671168044e-05, "epoch": 2.2635135135135136, "percentage": 56.59, "elapsed_time": "1:24:43", "remaining_time": "1:04:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 671, "total_steps": 1184, "loss": 0.1897, "learning_rate": 4.711204200281654e-05, "epoch": 2.266891891891892, "percentage": 56.67, "elapsed_time": "1:24:48", "remaining_time": "1:04:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 672, "total_steps": 1184, "loss": 0.1617, "learning_rate": 4.712282121756376e-05, "epoch": 2.27027027027027, "percentage": 56.76, "elapsed_time": "1:24:53", "remaining_time": "1:04:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 673, "total_steps": 1184, "loss": 0.1652, "learning_rate": 4.713358440373295e-05, "epoch": 2.2736486486486487, "percentage": 56.84, "elapsed_time": "1:24:58", "remaining_time": "1:04:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 674, "total_steps": 1184, "loss": 0.1872, "learning_rate": 4.7144331608922e-05, "epoch": 2.277027027027027, "percentage": 56.93, "elapsed_time": "1:25:04", "remaining_time": "1:04:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 675, "total_steps": 1184, "loss": 0.1603, "learning_rate": 4.715506288051709e-05, "epoch": 2.2804054054054053, "percentage": 57.01, "elapsed_time": "1:25:09", "remaining_time": "1:04:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 676, "total_steps": 1184, "loss": 0.1689, "learning_rate": 4.7165778265693935e-05, "epoch": 2.2837837837837838, "percentage": 57.09, "elapsed_time": "1:25:14", "remaining_time": "1:04:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 677, "total_steps": 1184, "loss": 0.1804, "learning_rate": 4.7176477811419076e-05, "epoch": 2.2871621621621623, "percentage": 57.18, "elapsed_time": "1:25:20", "remaining_time": "1:03:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 678, "total_steps": 1184, "loss": 0.1811, "learning_rate": 4.718716156445106e-05, "epoch": 2.2905405405405403, "percentage": 57.26, "elapsed_time": "1:25:25", "remaining_time": "1:03:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 679, "total_steps": 1184, "loss": 0.1805, "learning_rate": 4.7197829571341704e-05, "epoch": 2.293918918918919, "percentage": 57.35, "elapsed_time": "1:25:30", "remaining_time": "1:03:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 680, "total_steps": 1184, "loss": 0.1726, "learning_rate": 4.720848187843727e-05, "epoch": 2.2972972972972974, "percentage": 57.43, "elapsed_time": "1:25:35", "remaining_time": "1:03:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 681, "total_steps": 1184, "loss": 0.1663, "learning_rate": 4.721911853187975e-05, "epoch": 2.3006756756756754, "percentage": 57.52, "elapsed_time": "1:25:40", "remaining_time": "1:03:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 682, "total_steps": 1184, "loss": 0.1637, "learning_rate": 4.722973957760799e-05, "epoch": 2.304054054054054, "percentage": 57.6, "elapsed_time": "1:25:45", "remaining_time": "1:03:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 683, "total_steps": 1184, "loss": 0.178, "learning_rate": 4.724034506135888e-05, "epoch": 2.3074324324324325, "percentage": 57.69, "elapsed_time": "1:25:50", "remaining_time": "1:02:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 684, "total_steps": 1184, "loss": 0.1725, "learning_rate": 4.725093502866861e-05, "epoch": 2.310810810810811, "percentage": 57.77, "elapsed_time": "1:25:55", "remaining_time": "1:02:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 685, "total_steps": 1184, "loss": 0.161, "learning_rate": 4.7261509524873764e-05, "epoch": 2.314189189189189, "percentage": 57.85, "elapsed_time": "1:26:01", "remaining_time": "1:02:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 686, "total_steps": 1184, "loss": 0.1757, "learning_rate": 4.727206859511253e-05, "epoch": 2.3175675675675675, "percentage": 57.94, "elapsed_time": "1:26:06", "remaining_time": "1:02:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 687, "total_steps": 1184, "loss": 0.1975, "learning_rate": 4.7282612284325846e-05, "epoch": 2.320945945945946, "percentage": 58.02, "elapsed_time": "1:26:11", "remaining_time": "1:02:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 688, "total_steps": 1184, "loss": 0.1753, "learning_rate": 4.729314063725853e-05, "epoch": 2.3243243243243246, "percentage": 58.11, "elapsed_time": "1:26:16", "remaining_time": "1:02:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 689, "total_steps": 1184, "loss": 0.1959, "learning_rate": 4.730365369846044e-05, "epoch": 2.3277027027027026, "percentage": 58.19, "elapsed_time": "1:26:21", "remaining_time": "1:02:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 690, "total_steps": 1184, "loss": 0.1779, "learning_rate": 4.7314151512287594e-05, "epoch": 2.331081081081081, "percentage": 58.28, "elapsed_time": "1:26:26", "remaining_time": "1:01:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 691, "total_steps": 1184, "loss": 0.1647, "learning_rate": 4.732463412290331e-05, "epoch": 2.3344594594594597, "percentage": 58.36, "elapsed_time": "1:26:31", "remaining_time": "1:01:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 692, "total_steps": 1184, "loss": 0.1699, "learning_rate": 4.73351015742793e-05, "epoch": 2.3378378378378377, "percentage": 58.45, "elapsed_time": "1:26:36", "remaining_time": "1:01:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 693, "total_steps": 1184, "loss": 0.1785, "learning_rate": 4.7345553910196785e-05, "epoch": 2.3412162162162162, "percentage": 58.53, "elapsed_time": "1:26:42", "remaining_time": "1:01:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 694, "total_steps": 1184, "loss": 0.1806, "learning_rate": 4.735599117424759e-05, "epoch": 2.3445945945945947, "percentage": 58.61, "elapsed_time": "1:26:47", "remaining_time": "1:01:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 695, "total_steps": 1184, "loss": 0.1689, "learning_rate": 4.7366413409835235e-05, "epoch": 2.347972972972973, "percentage": 58.7, "elapsed_time": "1:26:52", "remaining_time": "1:01:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 696, "total_steps": 1184, "loss": 0.1757, "learning_rate": 4.737682066017604e-05, "epoch": 2.3513513513513513, "percentage": 58.78, "elapsed_time": "1:26:57", "remaining_time": "1:00:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 697, "total_steps": 1184, "loss": 0.1421, "learning_rate": 4.7387212968300166e-05, "epoch": 2.35472972972973, "percentage": 58.87, "elapsed_time": "1:27:02", "remaining_time": "1:00:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 698, "total_steps": 1184, "loss": 0.156, "learning_rate": 4.7397590377052686e-05, "epoch": 2.358108108108108, "percentage": 58.95, "elapsed_time": "1:27:07", "remaining_time": "1:00:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 699, "total_steps": 1184, "loss": 0.433, "learning_rate": 4.74079529290947e-05, "epoch": 2.3614864864864864, "percentage": 59.04, "elapsed_time": "1:27:12", "remaining_time": "1:00:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 700, "total_steps": 1184, "loss": 0.1738, "learning_rate": 4.741830066690428e-05, "epoch": 2.364864864864865, "percentage": 59.12, "elapsed_time": "1:27:17", "remaining_time": "1:00:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 701, "total_steps": 1184, "loss": 0.1859, "learning_rate": 4.742863363277765e-05, "epoch": 2.3682432432432434, "percentage": 59.21, "elapsed_time": "1:27:23", "remaining_time": "1:00:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 702, "total_steps": 1184, "loss": 0.1699, "learning_rate": 4.743895186883009e-05, "epoch": 2.3716216216216215, "percentage": 59.29, "elapsed_time": "1:27:28", "remaining_time": "1:00:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 703, "total_steps": 1184, "loss": 0.2042, "learning_rate": 4.7449255416997075e-05, "epoch": 2.375, "percentage": 59.38, "elapsed_time": "1:27:33", "remaining_time": "0:59:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 704, "total_steps": 1184, "loss": 0.1626, "learning_rate": 4.7459544319035206e-05, "epoch": 2.3783783783783785, "percentage": 59.46, "elapsed_time": "1:27:38", "remaining_time": "0:59:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 705, "total_steps": 1184, "loss": 0.1524, "learning_rate": 4.746981861652332e-05, "epoch": 2.3817567567567566, "percentage": 59.54, "elapsed_time": "1:27:43", "remaining_time": "0:59:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 706, "total_steps": 1184, "loss": 0.1965, "learning_rate": 4.74800783508634e-05, "epoch": 2.385135135135135, "percentage": 59.63, "elapsed_time": "1:27:48", "remaining_time": "0:59:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 707, "total_steps": 1184, "loss": 0.1703, "learning_rate": 4.7490323563281665e-05, "epoch": 2.3885135135135136, "percentage": 59.71, "elapsed_time": "1:27:53", "remaining_time": "0:59:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 708, "total_steps": 1184, "loss": 0.1468, "learning_rate": 4.750055429482949e-05, "epoch": 2.391891891891892, "percentage": 59.8, "elapsed_time": "1:27:58", "remaining_time": "0:59:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 709, "total_steps": 1184, "loss": 0.1959, "learning_rate": 4.751077058638445e-05, "epoch": 2.39527027027027, "percentage": 59.88, "elapsed_time": "1:28:04", "remaining_time": "0:59:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 710, "total_steps": 1184, "loss": 0.1876, "learning_rate": 4.752097247865126e-05, "epoch": 2.3986486486486487, "percentage": 59.97, "elapsed_time": "1:28:09", "remaining_time": "0:58:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 711, "total_steps": 1184, "loss": 0.1567, "learning_rate": 4.753116001216277e-05, "epoch": 2.402027027027027, "percentage": 60.05, "elapsed_time": "1:28:14", "remaining_time": "0:58:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 712, "total_steps": 1184, "loss": 0.171, "learning_rate": 4.7541333227280944e-05, "epoch": 2.4054054054054053, "percentage": 60.14, "elapsed_time": "1:28:19", "remaining_time": "0:58:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 713, "total_steps": 1184, "loss": 0.1973, "learning_rate": 4.755149216419776e-05, "epoch": 2.4087837837837838, "percentage": 60.22, "elapsed_time": "1:28:24", "remaining_time": "0:58:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 714, "total_steps": 1184, "loss": 0.1804, "learning_rate": 4.756163686293624e-05, "epoch": 2.4121621621621623, "percentage": 60.3, "elapsed_time": "1:28:29", "remaining_time": "0:58:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 715, "total_steps": 1184, "loss": 0.1913, "learning_rate": 4.7571767363351344e-05, "epoch": 2.4155405405405403, "percentage": 60.39, "elapsed_time": "1:28:34", "remaining_time": "0:58:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 716, "total_steps": 1184, "loss": 0.1852, "learning_rate": 4.758188370513093e-05, "epoch": 2.418918918918919, "percentage": 60.47, "elapsed_time": "1:28:39", "remaining_time": "0:57:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 717, "total_steps": 1184, "loss": 0.1925, "learning_rate": 4.759198592779667e-05, "epoch": 2.4222972972972974, "percentage": 60.56, "elapsed_time": "1:28:45", "remaining_time": "0:57:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 718, "total_steps": 1184, "loss": 0.1821, "learning_rate": 4.760207407070501e-05, "epoch": 2.4256756756756754, "percentage": 60.64, "elapsed_time": "1:28:50", "remaining_time": "0:57:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 719, "total_steps": 1184, "loss": 0.1837, "learning_rate": 4.761214817304805e-05, "epoch": 2.429054054054054, "percentage": 60.73, "elapsed_time": "1:28:55", "remaining_time": "0:57:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 720, "total_steps": 1184, "loss": 0.1685, "learning_rate": 4.762220827385448e-05, "epoch": 2.4324324324324325, "percentage": 60.81, "elapsed_time": "1:29:00", "remaining_time": "0:57:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 721, "total_steps": 1184, "loss": 0.432, "learning_rate": 4.763225441199049e-05, "epoch": 2.435810810810811, "percentage": 60.9, "elapsed_time": "1:29:05", "remaining_time": "0:57:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 722, "total_steps": 1184, "loss": 0.1847, "learning_rate": 4.7642286626160654e-05, "epoch": 2.439189189189189, "percentage": 60.98, "elapsed_time": "1:29:10", "remaining_time": "0:57:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 723, "total_steps": 1184, "loss": 0.1786, "learning_rate": 4.765230495490885e-05, "epoch": 2.4425675675675675, "percentage": 61.06, "elapsed_time": "1:29:15", "remaining_time": "0:56:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 724, "total_steps": 1184, "loss": 0.189, "learning_rate": 4.7662309436619115e-05, "epoch": 2.445945945945946, "percentage": 61.15, "elapsed_time": "1:29:20", "remaining_time": "0:56:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 725, "total_steps": 1184, "loss": 0.1794, "learning_rate": 4.7672300109516563e-05, "epoch": 2.4493243243243246, "percentage": 61.23, "elapsed_time": "1:29:26", "remaining_time": "0:56:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 726, "total_steps": 1184, "loss": 0.1666, "learning_rate": 4.768227701166823e-05, "epoch": 2.4527027027027026, "percentage": 61.32, "elapsed_time": "1:29:31", "remaining_time": "0:56:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 727, "total_steps": 1184, "loss": 0.1695, "learning_rate": 4.7692240180983964e-05, "epoch": 2.456081081081081, "percentage": 61.4, "elapsed_time": "1:29:36", "remaining_time": "0:56:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 728, "total_steps": 1184, "loss": 0.1519, "learning_rate": 4.770218965521729e-05, "epoch": 2.4594594594594597, "percentage": 61.49, "elapsed_time": "1:29:41", "remaining_time": "0:56:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 729, "total_steps": 1184, "loss": 0.1696, "learning_rate": 4.7712125471966245e-05, "epoch": 2.4628378378378377, "percentage": 61.57, "elapsed_time": "1:29:46", "remaining_time": "0:56:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 730, "total_steps": 1184, "loss": 0.174, "learning_rate": 4.7722047668674267e-05, "epoch": 2.4662162162162162, "percentage": 61.66, "elapsed_time": "1:29:51", "remaining_time": "0:55:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 731, "total_steps": 1184, "loss": 0.1696, "learning_rate": 4.7731956282631004e-05, "epoch": 2.4695945945945947, "percentage": 61.74, "elapsed_time": "1:29:56", "remaining_time": "0:55:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 732, "total_steps": 1184, "loss": 0.1731, "learning_rate": 4.77418513509732e-05, "epoch": 2.472972972972973, "percentage": 61.82, "elapsed_time": "1:30:01", "remaining_time": "0:55:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 733, "total_steps": 1184, "loss": 0.1787, "learning_rate": 4.775173291068547e-05, "epoch": 2.4763513513513513, "percentage": 61.91, "elapsed_time": "1:30:07", "remaining_time": "0:55:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 734, "total_steps": 1184, "loss": 0.1753, "learning_rate": 4.776160099860117e-05, "epoch": 2.47972972972973, "percentage": 61.99, "elapsed_time": "1:30:12", "remaining_time": "0:55:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 735, "total_steps": 1184, "loss": 0.1766, "learning_rate": 4.777145565140325e-05, "epoch": 2.483108108108108, "percentage": 62.08, "elapsed_time": "1:30:17", "remaining_time": "0:55:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 736, "total_steps": 1184, "loss": 0.1857, "learning_rate": 4.7781296905624986e-05, "epoch": 2.4864864864864864, "percentage": 62.16, "elapsed_time": "1:30:22", "remaining_time": "0:55:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 737, "total_steps": 1184, "loss": 0.1515, "learning_rate": 4.779112479765086e-05, "epoch": 2.489864864864865, "percentage": 62.25, "elapsed_time": "1:30:27", "remaining_time": "0:54:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 738, "total_steps": 1184, "loss": 0.1908, "learning_rate": 4.780093936371736e-05, "epoch": 2.4932432432432434, "percentage": 62.33, "elapsed_time": "1:30:32", "remaining_time": "0:54:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 739, "total_steps": 1184, "loss": 0.1812, "learning_rate": 4.781074063991376e-05, "epoch": 2.4966216216216215, "percentage": 62.42, "elapsed_time": "1:30:37", "remaining_time": "0:54:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 740, "total_steps": 1184, "loss": 0.1505, "learning_rate": 4.782052866218294e-05, "epoch": 2.5, "percentage": 62.5, "elapsed_time": "1:30:43", "remaining_time": "0:54:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 741, "total_steps": 1184, "loss": 0.1656, "learning_rate": 4.783030346632214e-05, "epoch": 2.5033783783783785, "percentage": 62.58, "elapsed_time": "1:30:48", "remaining_time": "0:54:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 742, "total_steps": 1184, "loss": 0.181, "learning_rate": 4.7840065087983786e-05, "epoch": 2.506756756756757, "percentage": 62.67, "elapsed_time": "1:30:53", "remaining_time": "0:54:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 743, "total_steps": 1184, "loss": 0.201, "learning_rate": 4.784981356267626e-05, "epoch": 2.510135135135135, "percentage": 62.75, "elapsed_time": "1:30:58", "remaining_time": "0:53:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 744, "total_steps": 1184, "loss": 0.1676, "learning_rate": 4.785954892576465e-05, "epoch": 2.5135135135135136, "percentage": 62.84, "elapsed_time": "1:31:03", "remaining_time": "0:53:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 745, "total_steps": 1184, "loss": 0.1807, "learning_rate": 4.7869271212471554e-05, "epoch": 2.516891891891892, "percentage": 62.92, "elapsed_time": "1:31:08", "remaining_time": "0:53:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 746, "total_steps": 1184, "loss": 0.1639, "learning_rate": 4.7878980457877814e-05, "epoch": 2.52027027027027, "percentage": 63.01, "elapsed_time": "1:31:13", "remaining_time": "0:53:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 747, "total_steps": 1184, "loss": 0.1844, "learning_rate": 4.7888676696923315e-05, "epoch": 2.5236486486486487, "percentage": 63.09, "elapsed_time": "1:31:18", "remaining_time": "0:53:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 748, "total_steps": 1184, "loss": 0.1536, "learning_rate": 4.7898359964407695e-05, "epoch": 2.527027027027027, "percentage": 63.18, "elapsed_time": "1:31:24", "remaining_time": "0:53:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 749, "total_steps": 1184, "loss": 0.1706, "learning_rate": 4.790803029499111e-05, "epoch": 2.5304054054054053, "percentage": 63.26, "elapsed_time": "1:31:29", "remaining_time": "0:53:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 750, "total_steps": 1184, "loss": 0.4571, "learning_rate": 4.7917687723195004e-05, "epoch": 2.5337837837837838, "percentage": 63.34, "elapsed_time": "1:31:34", "remaining_time": "0:52:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 751, "total_steps": 1184, "loss": 0.1907, "learning_rate": 4.792733228340281e-05, "epoch": 2.5371621621621623, "percentage": 63.43, "elapsed_time": "1:44:27", "remaining_time": "1:00:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 752, "total_steps": 1184, "loss": 0.163, "learning_rate": 4.793696400986071e-05, "epoch": 2.5405405405405403, "percentage": 63.51, "elapsed_time": "1:44:33", "remaining_time": "1:00:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 753, "total_steps": 1184, "loss": 0.2019, "learning_rate": 4.7946582936678344e-05, "epoch": 2.543918918918919, "percentage": 63.6, "elapsed_time": "1:44:38", "remaining_time": "0:59:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 754, "total_steps": 1184, "loss": 0.158, "learning_rate": 4.795618909782957e-05, "epoch": 2.5472972972972974, "percentage": 63.68, "elapsed_time": "1:44:43", "remaining_time": "0:59:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 755, "total_steps": 1184, "loss": 0.1769, "learning_rate": 4.796578252715314e-05, "epoch": 2.5506756756756754, "percentage": 63.77, "elapsed_time": "1:44:48", "remaining_time": "0:59:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 756, "total_steps": 1184, "loss": 0.17, "learning_rate": 4.797536325835345e-05, "epoch": 2.554054054054054, "percentage": 63.85, "elapsed_time": "1:44:53", "remaining_time": "0:59:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 757, "total_steps": 1184, "loss": 0.2163, "learning_rate": 4.7984931325001216e-05, "epoch": 2.5574324324324325, "percentage": 63.94, "elapsed_time": "1:44:58", "remaining_time": "0:59:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 758, "total_steps": 1184, "loss": 0.2086, "learning_rate": 4.799448676053423e-05, "epoch": 2.560810810810811, "percentage": 64.02, "elapsed_time": "1:45:03", "remaining_time": "0:59:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 759, "total_steps": 1184, "loss": 0.1884, "learning_rate": 4.800402959825802e-05, "epoch": 2.564189189189189, "percentage": 64.1, "elapsed_time": "1:45:08", "remaining_time": "0:58:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 760, "total_steps": 1184, "loss": 0.2024, "learning_rate": 4.801355987134653e-05, "epoch": 2.5675675675675675, "percentage": 64.19, "elapsed_time": "1:45:13", "remaining_time": "0:58:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 761, "total_steps": 1184, "loss": 0.1961, "learning_rate": 4.802307761284289e-05, "epoch": 2.570945945945946, "percentage": 64.27, "elapsed_time": "1:45:18", "remaining_time": "0:58:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 762, "total_steps": 1184, "loss": 0.1957, "learning_rate": 4.8032582855660014e-05, "epoch": 2.5743243243243246, "percentage": 64.36, "elapsed_time": "1:45:24", "remaining_time": "0:58:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 763, "total_steps": 1184, "loss": 0.1931, "learning_rate": 4.8042075632581346e-05, "epoch": 2.5777027027027026, "percentage": 64.44, "elapsed_time": "1:45:29", "remaining_time": "0:58:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 764, "total_steps": 1184, "loss": 0.1788, "learning_rate": 4.80515559762615e-05, "epoch": 2.581081081081081, "percentage": 64.53, "elapsed_time": "1:45:34", "remaining_time": "0:58:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 765, "total_steps": 1184, "loss": 0.1817, "learning_rate": 4.8061023919226964e-05, "epoch": 2.5844594594594597, "percentage": 64.61, "elapsed_time": "1:45:39", "remaining_time": "0:57:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 766, "total_steps": 1184, "loss": 0.1831, "learning_rate": 4.807047949387674e-05, "epoch": 2.5878378378378377, "percentage": 64.7, "elapsed_time": "1:45:44", "remaining_time": "0:57:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 767, "total_steps": 1184, "loss": 0.1683, "learning_rate": 4.807992273248302e-05, "epoch": 2.5912162162162162, "percentage": 64.78, "elapsed_time": "1:45:49", "remaining_time": "0:57:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 768, "total_steps": 1184, "loss": 0.1904, "learning_rate": 4.808935366719187e-05, "epoch": 2.5945945945945947, "percentage": 64.86, "elapsed_time": "1:45:54", "remaining_time": "0:57:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 769, "total_steps": 1184, "loss": 0.1742, "learning_rate": 4.8098772330023855e-05, "epoch": 2.597972972972973, "percentage": 64.95, "elapsed_time": "1:45:59", "remaining_time": "0:57:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 770, "total_steps": 1184, "loss": 0.1727, "learning_rate": 4.81081787528747e-05, "epoch": 2.6013513513513513, "percentage": 65.03, "elapsed_time": "1:46:04", "remaining_time": "0:57:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 771, "total_steps": 1184, "loss": 0.1904, "learning_rate": 4.811757296751595e-05, "epoch": 2.60472972972973, "percentage": 65.12, "elapsed_time": "1:46:09", "remaining_time": "0:56:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 772, "total_steps": 1184, "loss": 0.1931, "learning_rate": 4.812695500559561e-05, "epoch": 2.608108108108108, "percentage": 65.2, "elapsed_time": "1:46:15", "remaining_time": "0:56:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 773, "total_steps": 1184, "loss": 0.2105, "learning_rate": 4.8136324898638756e-05, "epoch": 2.6114864864864864, "percentage": 65.29, "elapsed_time": "1:46:20", "remaining_time": "0:56:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 774, "total_steps": 1184, "loss": 0.1831, "learning_rate": 4.8145682678048214e-05, "epoch": 2.614864864864865, "percentage": 65.37, "elapsed_time": "1:46:25", "remaining_time": "0:56:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 775, "total_steps": 1184, "loss": 0.1975, "learning_rate": 4.815502837510518e-05, "epoch": 2.618243243243243, "percentage": 65.46, "elapsed_time": "1:46:30", "remaining_time": "0:56:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 776, "total_steps": 1184, "loss": 0.1744, "learning_rate": 4.816436202096981e-05, "epoch": 2.6216216216216215, "percentage": 65.54, "elapsed_time": "1:46:35", "remaining_time": "0:56:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 777, "total_steps": 1184, "loss": 0.1782, "learning_rate": 4.81736836466819e-05, "epoch": 2.625, "percentage": 65.62, "elapsed_time": "1:46:40", "remaining_time": "0:55:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 778, "total_steps": 1184, "loss": 0.1941, "learning_rate": 4.8182993283161485e-05, "epoch": 2.6283783783783785, "percentage": 65.71, "elapsed_time": "1:46:45", "remaining_time": "0:55:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 779, "total_steps": 1184, "loss": 0.1681, "learning_rate": 4.819229096120941e-05, "epoch": 2.631756756756757, "percentage": 65.79, "elapsed_time": "1:46:50", "remaining_time": "0:55:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 780, "total_steps": 1184, "loss": 0.1941, "learning_rate": 4.820157671150801e-05, "epoch": 2.635135135135135, "percentage": 65.88, "elapsed_time": "1:46:56", "remaining_time": "0:55:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 781, "total_steps": 1184, "loss": 0.1744, "learning_rate": 4.821085056462168e-05, "epoch": 2.6385135135135136, "percentage": 65.96, "elapsed_time": "1:47:01", "remaining_time": "0:55:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 782, "total_steps": 1184, "loss": 0.1803, "learning_rate": 4.822011255099747e-05, "epoch": 2.641891891891892, "percentage": 66.05, "elapsed_time": "1:47:06", "remaining_time": "0:55:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 783, "total_steps": 1184, "loss": 0.1651, "learning_rate": 4.8229362700965726e-05, "epoch": 2.64527027027027, "percentage": 66.13, "elapsed_time": "1:47:11", "remaining_time": "0:54:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 784, "total_steps": 1184, "loss": 0.183, "learning_rate": 4.8238601044740645e-05, "epoch": 2.6486486486486487, "percentage": 66.22, "elapsed_time": "1:47:16", "remaining_time": "0:54:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 785, "total_steps": 1184, "loss": 0.1637, "learning_rate": 4.824782761242088e-05, "epoch": 2.652027027027027, "percentage": 66.3, "elapsed_time": "1:47:21", "remaining_time": "0:54:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 786, "total_steps": 1184, "loss": 0.18, "learning_rate": 4.8257042433990135e-05, "epoch": 2.6554054054054053, "percentage": 66.39, "elapsed_time": "1:47:26", "remaining_time": "0:54:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 787, "total_steps": 1184, "loss": 0.1886, "learning_rate": 4.826624553931775e-05, "epoch": 2.6587837837837838, "percentage": 66.47, "elapsed_time": "1:47:31", "remaining_time": "0:54:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 788, "total_steps": 1184, "loss": 0.1718, "learning_rate": 4.827543695815926e-05, "epoch": 2.6621621621621623, "percentage": 66.55, "elapsed_time": "1:47:36", "remaining_time": "0:54:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 789, "total_steps": 1184, "loss": 0.1698, "learning_rate": 4.8284616720157006e-05, "epoch": 2.6655405405405403, "percentage": 66.64, "elapsed_time": "1:47:42", "remaining_time": "0:53:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 790, "total_steps": 1184, "loss": 0.1885, "learning_rate": 4.82937848548407e-05, "epoch": 2.668918918918919, "percentage": 66.72, "elapsed_time": "1:47:47", "remaining_time": "0:53:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 791, "total_steps": 1184, "loss": 0.1891, "learning_rate": 4.8302941391627947e-05, "epoch": 2.6722972972972974, "percentage": 66.81, "elapsed_time": "1:47:52", "remaining_time": "0:53:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 792, "total_steps": 1184, "loss": 0.1888, "learning_rate": 4.83120863598249e-05, "epoch": 2.6756756756756754, "percentage": 66.89, "elapsed_time": "1:47:57", "remaining_time": "0:53:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 793, "total_steps": 1184, "loss": 0.1842, "learning_rate": 4.832121978862673e-05, "epoch": 2.679054054054054, "percentage": 66.98, "elapsed_time": "1:48:02", "remaining_time": "0:53:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 794, "total_steps": 1184, "loss": 0.1681, "learning_rate": 4.8330341707118276e-05, "epoch": 2.6824324324324325, "percentage": 67.06, "elapsed_time": "1:48:07", "remaining_time": "0:53:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 795, "total_steps": 1184, "loss": 0.1756, "learning_rate": 4.833945214427451e-05, "epoch": 2.685810810810811, "percentage": 67.15, "elapsed_time": "1:48:12", "remaining_time": "0:52:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 796, "total_steps": 1184, "loss": 0.2146, "learning_rate": 4.834855112896116e-05, "epoch": 2.689189189189189, "percentage": 67.23, "elapsed_time": "1:48:17", "remaining_time": "0:52:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 797, "total_steps": 1184, "loss": 0.1851, "learning_rate": 4.835763868993521e-05, "epoch": 2.6925675675675675, "percentage": 67.31, "elapsed_time": "1:48:23", "remaining_time": "0:52:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 798, "total_steps": 1184, "loss": 0.1809, "learning_rate": 4.8366714855845496e-05, "epoch": 2.695945945945946, "percentage": 67.4, "elapsed_time": "1:48:28", "remaining_time": "0:52:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 799, "total_steps": 1184, "loss": 0.1887, "learning_rate": 4.837577965523319e-05, "epoch": 2.6993243243243246, "percentage": 67.48, "elapsed_time": "1:48:33", "remaining_time": "0:52:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 800, "total_steps": 1184, "loss": 0.1732, "learning_rate": 4.8384833116532396e-05, "epoch": 2.7027027027027026, "percentage": 67.57, "elapsed_time": "1:48:38", "remaining_time": "0:52:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 801, "total_steps": 1184, "loss": 0.1952, "learning_rate": 4.8393875268070636e-05, "epoch": 2.706081081081081, "percentage": 67.65, "elapsed_time": "1:48:43", "remaining_time": "0:51:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 802, "total_steps": 1184, "loss": 0.1903, "learning_rate": 4.84029061380694e-05, "epoch": 2.7094594594594597, "percentage": 67.74, "elapsed_time": "1:48:48", "remaining_time": "0:51:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 803, "total_steps": 1184, "loss": 0.2035, "learning_rate": 4.841192575464469e-05, "epoch": 2.7128378378378377, "percentage": 67.82, "elapsed_time": "1:48:53", "remaining_time": "0:51:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 804, "total_steps": 1184, "loss": 0.2002, "learning_rate": 4.842093414580753e-05, "epoch": 2.7162162162162162, "percentage": 67.91, "elapsed_time": "1:48:58", "remaining_time": "0:51:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 805, "total_steps": 1184, "loss": 0.2299, "learning_rate": 4.842993133946448e-05, "epoch": 2.7195945945945947, "percentage": 67.99, "elapsed_time": "1:49:03", "remaining_time": "0:51:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 806, "total_steps": 1184, "loss": 0.1931, "learning_rate": 4.843891736341818e-05, "epoch": 2.722972972972973, "percentage": 68.07, "elapsed_time": "1:49:09", "remaining_time": "0:51:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 807, "total_steps": 1184, "loss": 0.2012, "learning_rate": 4.8447892245367846e-05, "epoch": 2.7263513513513513, "percentage": 68.16, "elapsed_time": "1:49:14", "remaining_time": "0:51:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 808, "total_steps": 1184, "loss": 0.1988, "learning_rate": 4.845685601290977e-05, "epoch": 2.72972972972973, "percentage": 68.24, "elapsed_time": "1:49:19", "remaining_time": "0:50:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 809, "total_steps": 1184, "loss": 0.1966, "learning_rate": 4.846580869353787e-05, "epoch": 2.733108108108108, "percentage": 68.33, "elapsed_time": "1:49:24", "remaining_time": "0:50:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 810, "total_steps": 1184, "loss": 0.1861, "learning_rate": 4.847475031464416e-05, "epoch": 2.7364864864864864, "percentage": 68.41, "elapsed_time": "1:49:29", "remaining_time": "0:50:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 811, "total_steps": 1184, "loss": 0.2009, "learning_rate": 4.8483680903519274e-05, "epoch": 2.739864864864865, "percentage": 68.5, "elapsed_time": "1:49:34", "remaining_time": "0:50:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 812, "total_steps": 1184, "loss": 0.1692, "learning_rate": 4.8492600487352926e-05, "epoch": 2.743243243243243, "percentage": 68.58, "elapsed_time": "1:49:39", "remaining_time": "0:50:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 813, "total_steps": 1184, "loss": 0.1904, "learning_rate": 4.850150909323447e-05, "epoch": 2.7466216216216215, "percentage": 68.67, "elapsed_time": "1:49:44", "remaining_time": "0:50:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 814, "total_steps": 1184, "loss": 0.1782, "learning_rate": 4.8510406748153355e-05, "epoch": 2.75, "percentage": 68.75, "elapsed_time": "1:49:50", "remaining_time": "0:49:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 815, "total_steps": 1184, "loss": 0.1824, "learning_rate": 4.8519293478999614e-05, "epoch": 2.7533783783783785, "percentage": 68.83, "elapsed_time": "1:49:55", "remaining_time": "0:49:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 816, "total_steps": 1184, "loss": 0.1799, "learning_rate": 4.8528169312564355e-05, "epoch": 2.756756756756757, "percentage": 68.92, "elapsed_time": "1:50:00", "remaining_time": "0:49:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 817, "total_steps": 1184, "loss": 0.1792, "learning_rate": 4.8537034275540264e-05, "epoch": 2.760135135135135, "percentage": 69.0, "elapsed_time": "1:50:05", "remaining_time": "0:49:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 818, "total_steps": 1184, "loss": 0.1842, "learning_rate": 4.854588839452205e-05, "epoch": 2.7635135135135136, "percentage": 69.09, "elapsed_time": "1:50:10", "remaining_time": "0:49:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 819, "total_steps": 1184, "loss": 0.1781, "learning_rate": 4.855473169600698e-05, "epoch": 2.766891891891892, "percentage": 69.17, "elapsed_time": "1:50:15", "remaining_time": "0:49:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 820, "total_steps": 1184, "loss": 0.2129, "learning_rate": 4.856356420639528e-05, "epoch": 2.77027027027027, "percentage": 69.26, "elapsed_time": "1:50:20", "remaining_time": "0:48:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 821, "total_steps": 1184, "loss": 0.1844, "learning_rate": 4.857238595199068e-05, "epoch": 2.7736486486486487, "percentage": 69.34, "elapsed_time": "1:50:26", "remaining_time": "0:48:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 822, "total_steps": 1184, "loss": 0.1917, "learning_rate": 4.858119695900084e-05, "epoch": 2.777027027027027, "percentage": 69.43, "elapsed_time": "1:50:31", "remaining_time": "0:48:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 823, "total_steps": 1184, "loss": 0.1562, "learning_rate": 4.858999725353783e-05, "epoch": 2.7804054054054053, "percentage": 69.51, "elapsed_time": "1:50:36", "remaining_time": "0:48:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 824, "total_steps": 1184, "loss": 0.1963, "learning_rate": 4.8598786861618605e-05, "epoch": 2.7837837837837838, "percentage": 69.59, "elapsed_time": "1:50:41", "remaining_time": "0:48:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 825, "total_steps": 1184, "loss": 0.1811, "learning_rate": 4.860756580916542e-05, "epoch": 2.7871621621621623, "percentage": 69.68, "elapsed_time": "1:50:46", "remaining_time": "0:48:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 826, "total_steps": 1184, "loss": 0.1914, "learning_rate": 4.861633412200637e-05, "epoch": 2.7905405405405403, "percentage": 69.76, "elapsed_time": "1:50:51", "remaining_time": "0:48:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 827, "total_steps": 1184, "loss": 0.1587, "learning_rate": 4.862509182587578e-05, "epoch": 2.793918918918919, "percentage": 69.85, "elapsed_time": "1:50:56", "remaining_time": "0:47:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 828, "total_steps": 1184, "loss": 0.1648, "learning_rate": 4.863383894641467e-05, "epoch": 2.7972972972972974, "percentage": 69.93, "elapsed_time": "1:51:01", "remaining_time": "0:47:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 829, "total_steps": 1184, "loss": 0.1867, "learning_rate": 4.864257550917123e-05, "epoch": 2.8006756756756754, "percentage": 70.02, "elapsed_time": "1:51:07", "remaining_time": "0:47:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 830, "total_steps": 1184, "loss": 0.1789, "learning_rate": 4.865130153960124e-05, "epoch": 2.804054054054054, "percentage": 70.1, "elapsed_time": "1:51:12", "remaining_time": "0:47:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 831, "total_steps": 1184, "loss": 0.1718, "learning_rate": 4.8660017063068526e-05, "epoch": 2.8074324324324325, "percentage": 70.19, "elapsed_time": "1:51:17", "remaining_time": "0:47:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 832, "total_steps": 1184, "loss": 0.1911, "learning_rate": 4.8668722104845403e-05, "epoch": 2.810810810810811, "percentage": 70.27, "elapsed_time": "1:51:22", "remaining_time": "0:47:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 833, "total_steps": 1184, "loss": 0.1968, "learning_rate": 4.8677416690113134e-05, "epoch": 2.814189189189189, "percentage": 70.35, "elapsed_time": "1:51:27", "remaining_time": "0:46:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 834, "total_steps": 1184, "loss": 0.1612, "learning_rate": 4.868610084396232e-05, "epoch": 2.8175675675675675, "percentage": 70.44, "elapsed_time": "1:51:32", "remaining_time": "0:46:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 835, "total_steps": 1184, "loss": 0.1608, "learning_rate": 4.869477459139337e-05, "epoch": 2.820945945945946, "percentage": 70.52, "elapsed_time": "1:51:37", "remaining_time": "0:46:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 836, "total_steps": 1184, "loss": 0.1846, "learning_rate": 4.870343795731694e-05, "epoch": 2.8243243243243246, "percentage": 70.61, "elapsed_time": "1:51:42", "remaining_time": "0:46:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 837, "total_steps": 1184, "loss": 0.1954, "learning_rate": 4.8712090966554334e-05, "epoch": 2.8277027027027026, "percentage": 70.69, "elapsed_time": "1:51:48", "remaining_time": "0:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 838, "total_steps": 1184, "loss": 0.1875, "learning_rate": 4.872073364383795e-05, "epoch": 2.831081081081081, "percentage": 70.78, "elapsed_time": "1:51:53", "remaining_time": "0:46:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 839, "total_steps": 1184, "loss": 0.2066, "learning_rate": 4.8729366013811674e-05, "epoch": 2.8344594594594597, "percentage": 70.86, "elapsed_time": "1:51:58", "remaining_time": "0:46:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 840, "total_steps": 1184, "loss": 0.1836, "learning_rate": 4.8737988101031366e-05, "epoch": 2.8378378378378377, "percentage": 70.95, "elapsed_time": "1:52:03", "remaining_time": "0:45:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 841, "total_steps": 1184, "loss": 0.1687, "learning_rate": 4.874659992996521e-05, "epoch": 2.8412162162162162, "percentage": 71.03, "elapsed_time": "1:52:08", "remaining_time": "0:45:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 842, "total_steps": 1184, "loss": 0.2006, "learning_rate": 4.875520152499416e-05, "epoch": 2.8445945945945947, "percentage": 71.11, "elapsed_time": "1:52:13", "remaining_time": "0:45:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 843, "total_steps": 1184, "loss": 0.2175, "learning_rate": 4.876379291041238e-05, "epoch": 2.847972972972973, "percentage": 71.2, "elapsed_time": "1:52:18", "remaining_time": "0:45:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 844, "total_steps": 1184, "loss": 0.1779, "learning_rate": 4.8772374110427594e-05, "epoch": 2.8513513513513513, "percentage": 71.28, "elapsed_time": "1:52:23", "remaining_time": "0:45:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 845, "total_steps": 1184, "loss": 0.2, "learning_rate": 4.878094514916154e-05, "epoch": 2.85472972972973, "percentage": 71.37, "elapsed_time": "1:52:29", "remaining_time": "0:45:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 846, "total_steps": 1184, "loss": 0.1818, "learning_rate": 4.8789506050650396e-05, "epoch": 2.858108108108108, "percentage": 71.45, "elapsed_time": "1:52:34", "remaining_time": "0:44:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 847, "total_steps": 1184, "loss": 0.2029, "learning_rate": 4.879805683884512e-05, "epoch": 2.8614864864864864, "percentage": 71.54, "elapsed_time": "1:52:39", "remaining_time": "0:44:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 848, "total_steps": 1184, "loss": 0.1936, "learning_rate": 4.8806597537611906e-05, "epoch": 2.864864864864865, "percentage": 71.62, "elapsed_time": "1:52:44", "remaining_time": "0:44:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 849, "total_steps": 1184, "loss": 0.1765, "learning_rate": 4.881512817073255e-05, "epoch": 2.868243243243243, "percentage": 71.71, "elapsed_time": "1:52:49", "remaining_time": "0:44:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 850, "total_steps": 1184, "loss": 0.1594, "learning_rate": 4.882364876190489e-05, "epoch": 2.8716216216216215, "percentage": 71.79, "elapsed_time": "1:52:54", "remaining_time": "0:44:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 851, "total_steps": 1184, "loss": 0.1773, "learning_rate": 4.8832159334743136e-05, "epoch": 2.875, "percentage": 71.88, "elapsed_time": "1:52:59", "remaining_time": "0:44:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 852, "total_steps": 1184, "loss": 0.2057, "learning_rate": 4.884065991277833e-05, "epoch": 2.8783783783783785, "percentage": 71.96, "elapsed_time": "1:53:04", "remaining_time": "0:44:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 853, "total_steps": 1184, "loss": 0.1726, "learning_rate": 4.8849150519458726e-05, "epoch": 2.881756756756757, "percentage": 72.04, "elapsed_time": "1:53:10", "remaining_time": "0:43:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 854, "total_steps": 1184, "loss": 0.178, "learning_rate": 4.885763117815009e-05, "epoch": 2.885135135135135, "percentage": 72.13, "elapsed_time": "1:53:15", "remaining_time": "0:43:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 855, "total_steps": 1184, "loss": 0.1816, "learning_rate": 4.886610191213622e-05, "epoch": 2.8885135135135136, "percentage": 72.21, "elapsed_time": "1:53:20", "remaining_time": "0:43:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 856, "total_steps": 1184, "loss": 0.2068, "learning_rate": 4.887456274461922e-05, "epoch": 2.891891891891892, "percentage": 72.3, "elapsed_time": "1:53:25", "remaining_time": "0:43:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 857, "total_steps": 1184, "loss": 0.215, "learning_rate": 4.8883013698719973e-05, "epoch": 2.89527027027027, "percentage": 72.38, "elapsed_time": "1:53:30", "remaining_time": "0:43:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 858, "total_steps": 1184, "loss": 0.181, "learning_rate": 4.889145479747843e-05, "epoch": 2.8986486486486487, "percentage": 72.47, "elapsed_time": "1:53:35", "remaining_time": "0:43:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 859, "total_steps": 1184, "loss": 0.1878, "learning_rate": 4.889988606385404e-05, "epoch": 2.902027027027027, "percentage": 72.55, "elapsed_time": "1:53:40", "remaining_time": "0:43:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 860, "total_steps": 1184, "loss": 0.1948, "learning_rate": 4.8908307520726135e-05, "epoch": 2.9054054054054053, "percentage": 72.64, "elapsed_time": "1:53:45", "remaining_time": "0:42:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 861, "total_steps": 1184, "loss": 0.2007, "learning_rate": 4.891671919089425e-05, "epoch": 2.9087837837837838, "percentage": 72.72, "elapsed_time": "1:53:51", "remaining_time": "0:42:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 862, "total_steps": 1184, "loss": 0.1865, "learning_rate": 4.892512109707855e-05, "epoch": 2.9121621621621623, "percentage": 72.8, "elapsed_time": "1:53:56", "remaining_time": "0:42:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 863, "total_steps": 1184, "loss": 0.1831, "learning_rate": 4.893351326192016e-05, "epoch": 2.9155405405405403, "percentage": 72.89, "elapsed_time": "1:54:01", "remaining_time": "0:42:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 864, "total_steps": 1184, "loss": 0.1494, "learning_rate": 4.894189570798156e-05, "epoch": 2.918918918918919, "percentage": 72.97, "elapsed_time": "1:54:06", "remaining_time": "0:42:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 865, "total_steps": 1184, "loss": 0.2045, "learning_rate": 4.895026845774691e-05, "epoch": 2.9222972972972974, "percentage": 73.06, "elapsed_time": "1:54:11", "remaining_time": "0:42:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 866, "total_steps": 1184, "loss": 0.1818, "learning_rate": 4.895863153362244e-05, "epoch": 2.9256756756756754, "percentage": 73.14, "elapsed_time": "1:54:16", "remaining_time": "0:41:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 867, "total_steps": 1184, "loss": 0.1936, "learning_rate": 4.896698495793684e-05, "epoch": 2.929054054054054, "percentage": 73.23, "elapsed_time": "1:54:21", "remaining_time": "0:41:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 868, "total_steps": 1184, "loss": 0.1964, "learning_rate": 4.897532875294154e-05, "epoch": 2.9324324324324325, "percentage": 73.31, "elapsed_time": "1:54:26", "remaining_time": "0:41:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 869, "total_steps": 1184, "loss": 0.1737, "learning_rate": 4.8983662940811115e-05, "epoch": 2.935810810810811, "percentage": 73.4, "elapsed_time": "1:54:32", "remaining_time": "0:41:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 870, "total_steps": 1184, "loss": 0.1488, "learning_rate": 4.899198754364365e-05, "epoch": 2.939189189189189, "percentage": 73.48, "elapsed_time": "1:54:37", "remaining_time": "0:41:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 871, "total_steps": 1184, "loss": 0.1822, "learning_rate": 4.900030258346106e-05, "epoch": 2.9425675675675675, "percentage": 73.56, "elapsed_time": "1:54:42", "remaining_time": "0:41:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 872, "total_steps": 1184, "loss": 0.1846, "learning_rate": 4.900860808220946e-05, "epoch": 2.945945945945946, "percentage": 73.65, "elapsed_time": "1:54:47", "remaining_time": "0:41:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 873, "total_steps": 1184, "loss": 0.2105, "learning_rate": 4.90169040617595e-05, "epoch": 2.9493243243243246, "percentage": 73.73, "elapsed_time": "1:54:52", "remaining_time": "0:40:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 874, "total_steps": 1184, "loss": 0.1815, "learning_rate": 4.9025190543906715e-05, "epoch": 2.9527027027027026, "percentage": 73.82, "elapsed_time": "1:54:57", "remaining_time": "0:40:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 875, "total_steps": 1184, "loss": 0.1713, "learning_rate": 4.903346755037189e-05, "epoch": 2.956081081081081, "percentage": 73.9, "elapsed_time": "1:55:02", "remaining_time": "0:40:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 876, "total_steps": 1184, "loss": 0.1915, "learning_rate": 4.904173510280135e-05, "epoch": 2.9594594594594597, "percentage": 73.99, "elapsed_time": "1:55:07", "remaining_time": "0:40:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 877, "total_steps": 1184, "loss": 0.2157, "learning_rate": 4.904999322276735e-05, "epoch": 2.9628378378378377, "percentage": 74.07, "elapsed_time": "1:55:13", "remaining_time": "0:40:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 878, "total_steps": 1184, "loss": 0.1947, "learning_rate": 4.9058241931768385e-05, "epoch": 2.9662162162162162, "percentage": 74.16, "elapsed_time": "1:55:18", "remaining_time": "0:40:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 879, "total_steps": 1184, "loss": 0.1836, "learning_rate": 4.9066481251229535e-05, "epoch": 2.9695945945945947, "percentage": 74.24, "elapsed_time": "1:55:23", "remaining_time": "0:40:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 880, "total_steps": 1184, "loss": 0.4757, "learning_rate": 4.907471120250281e-05, "epoch": 2.972972972972973, "percentage": 74.32, "elapsed_time": "1:55:28", "remaining_time": "0:39:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 881, "total_steps": 1184, "loss": 0.2003, "learning_rate": 4.9082931806867474e-05, "epoch": 2.9763513513513513, "percentage": 74.41, "elapsed_time": "1:55:33", "remaining_time": "0:39:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 882, "total_steps": 1184, "loss": 0.19, "learning_rate": 4.909114308553033e-05, "epoch": 2.97972972972973, "percentage": 74.49, "elapsed_time": "1:55:38", "remaining_time": "0:39:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 883, "total_steps": 1184, "loss": 0.2071, "learning_rate": 4.909934505962615e-05, "epoch": 2.983108108108108, "percentage": 74.58, "elapsed_time": "1:55:43", "remaining_time": "0:39:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 884, "total_steps": 1184, "loss": 0.1742, "learning_rate": 4.9107537750217886e-05, "epoch": 2.9864864864864864, "percentage": 74.66, "elapsed_time": "1:55:48", "remaining_time": "0:39:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 885, "total_steps": 1184, "loss": 0.1734, "learning_rate": 4.9115721178297093e-05, "epoch": 2.989864864864865, "percentage": 74.75, "elapsed_time": "1:55:54", "remaining_time": "0:39:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 886, "total_steps": 1184, "loss": 0.1623, "learning_rate": 4.9123895364784184e-05, "epoch": 2.993243243243243, "percentage": 74.83, "elapsed_time": "1:55:59", "remaining_time": "0:39:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 887, "total_steps": 1184, "loss": 0.1647, "learning_rate": 4.913206033052877e-05, "epoch": 2.9966216216216215, "percentage": 74.92, "elapsed_time": "1:56:04", "remaining_time": "0:38:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 888, "total_steps": 1184, "loss": 0.1831, "learning_rate": 4.914021609631002e-05, "epoch": 3.0, "percentage": 75.0, "elapsed_time": "1:56:09", "remaining_time": "0:38:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 889, "total_steps": 1184, "loss": 0.128, "learning_rate": 4.91483626828369e-05, "epoch": 3.0033783783783785, "percentage": 75.08, "elapsed_time": "1:56:14", "remaining_time": "0:38:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 890, "total_steps": 1184, "loss": 0.1077, "learning_rate": 4.915650011074855e-05, "epoch": 3.0067567567567566, "percentage": 75.17, "elapsed_time": "1:56:19", "remaining_time": "0:38:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 891, "total_steps": 1184, "loss": 0.11, "learning_rate": 4.916462840061458e-05, "epoch": 3.010135135135135, "percentage": 75.25, "elapsed_time": "1:56:24", "remaining_time": "0:38:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 892, "total_steps": 1184, "loss": 0.1032, "learning_rate": 4.917274757293539e-05, "epoch": 3.0135135135135136, "percentage": 75.34, "elapsed_time": "1:56:29", "remaining_time": "0:38:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 893, "total_steps": 1184, "loss": 0.1304, "learning_rate": 4.918085764814244e-05, "epoch": 3.016891891891892, "percentage": 75.42, "elapsed_time": "1:56:35", "remaining_time": "0:37:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 894, "total_steps": 1184, "loss": 0.0949, "learning_rate": 4.9188958646598624e-05, "epoch": 3.02027027027027, "percentage": 75.51, "elapsed_time": "1:56:40", "remaining_time": "0:37:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 895, "total_steps": 1184, "loss": 0.0989, "learning_rate": 4.919705058859854e-05, "epoch": 3.0236486486486487, "percentage": 75.59, "elapsed_time": "1:56:45", "remaining_time": "0:37:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 896, "total_steps": 1184, "loss": 0.1152, "learning_rate": 4.920513349436875e-05, "epoch": 3.027027027027027, "percentage": 75.68, "elapsed_time": "1:56:50", "remaining_time": "0:37:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 897, "total_steps": 1184, "loss": 0.1163, "learning_rate": 4.92132073840682e-05, "epoch": 3.0304054054054053, "percentage": 75.76, "elapsed_time": "1:56:56", "remaining_time": "0:37:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 898, "total_steps": 1184, "loss": 0.1078, "learning_rate": 4.922127227778841e-05, "epoch": 3.0337837837837838, "percentage": 75.84, "elapsed_time": "1:57:01", "remaining_time": "0:37:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 899, "total_steps": 1184, "loss": 0.1165, "learning_rate": 4.9229328195553815e-05, "epoch": 3.0371621621621623, "percentage": 75.93, "elapsed_time": "1:57:06", "remaining_time": "0:37:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 900, "total_steps": 1184, "loss": 0.12, "learning_rate": 4.923737515732209e-05, "epoch": 3.0405405405405403, "percentage": 76.01, "elapsed_time": "1:57:11", "remaining_time": "0:36:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 901, "total_steps": 1184, "loss": 0.1131, "learning_rate": 4.924541318298438e-05, "epoch": 3.043918918918919, "percentage": 76.1, "elapsed_time": "1:57:16", "remaining_time": "0:36:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 902, "total_steps": 1184, "loss": 0.1025, "learning_rate": 4.92534422923657e-05, "epoch": 3.0472972972972974, "percentage": 76.18, "elapsed_time": "1:57:21", "remaining_time": "0:36:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 903, "total_steps": 1184, "loss": 0.1207, "learning_rate": 4.9261462505225106e-05, "epoch": 3.050675675675676, "percentage": 76.27, "elapsed_time": "1:57:26", "remaining_time": "0:36:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 904, "total_steps": 1184, "loss": 0.1115, "learning_rate": 4.926947384125606e-05, "epoch": 3.054054054054054, "percentage": 76.35, "elapsed_time": "1:57:31", "remaining_time": "0:36:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 905, "total_steps": 1184, "loss": 0.1151, "learning_rate": 4.927747632008672e-05, "epoch": 3.0574324324324325, "percentage": 76.44, "elapsed_time": "1:57:36", "remaining_time": "0:36:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 906, "total_steps": 1184, "loss": 0.113, "learning_rate": 4.9285469961280226e-05, "epoch": 3.060810810810811, "percentage": 76.52, "elapsed_time": "1:57:42", "remaining_time": "0:36:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 907, "total_steps": 1184, "loss": 0.1157, "learning_rate": 4.9293454784334924e-05, "epoch": 3.064189189189189, "percentage": 76.6, "elapsed_time": "1:57:47", "remaining_time": "0:35:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 908, "total_steps": 1184, "loss": 0.1031, "learning_rate": 4.9301430808684754e-05, "epoch": 3.0675675675675675, "percentage": 76.69, "elapsed_time": "1:57:52", "remaining_time": "0:35:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 909, "total_steps": 1184, "loss": 0.1043, "learning_rate": 4.930939805369946e-05, "epoch": 3.070945945945946, "percentage": 76.77, "elapsed_time": "1:58:00", "remaining_time": "0:35:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 910, "total_steps": 1184, "loss": 0.1109, "learning_rate": 4.93173565386849e-05, "epoch": 3.074324324324324, "percentage": 76.86, "elapsed_time": "1:58:05", "remaining_time": "0:35:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 911, "total_steps": 1184, "loss": 0.1047, "learning_rate": 4.932530628288331e-05, "epoch": 3.0777027027027026, "percentage": 76.94, "elapsed_time": "1:58:10", "remaining_time": "0:35:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 912, "total_steps": 1184, "loss": 0.0961, "learning_rate": 4.933324730547361e-05, "epoch": 3.081081081081081, "percentage": 77.03, "elapsed_time": "1:58:15", "remaining_time": "0:35:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 913, "total_steps": 1184, "loss": 0.1178, "learning_rate": 4.934117962557165e-05, "epoch": 3.0844594594594597, "percentage": 77.11, "elapsed_time": "1:58:20", "remaining_time": "0:35:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 914, "total_steps": 1184, "loss": 0.1179, "learning_rate": 4.9349103262230524e-05, "epoch": 3.0878378378378377, "percentage": 77.2, "elapsed_time": "1:58:25", "remaining_time": "0:34:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 915, "total_steps": 1184, "loss": 0.1161, "learning_rate": 4.935701823444081e-05, "epoch": 3.0912162162162162, "percentage": 77.28, "elapsed_time": "1:58:32", "remaining_time": "0:34:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 916, "total_steps": 1184, "loss": 0.1167, "learning_rate": 4.9364924561130845e-05, "epoch": 3.0945945945945947, "percentage": 77.36, "elapsed_time": "1:58:37", "remaining_time": "0:34:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 917, "total_steps": 1184, "loss": 0.1305, "learning_rate": 4.937282226116702e-05, "epoch": 3.097972972972973, "percentage": 77.45, "elapsed_time": "1:58:42", "remaining_time": "0:34:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 918, "total_steps": 1184, "loss": 0.1018, "learning_rate": 4.938071135335405e-05, "epoch": 3.1013513513513513, "percentage": 77.53, "elapsed_time": "1:58:47", "remaining_time": "0:34:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 919, "total_steps": 1184, "loss": 0.1156, "learning_rate": 4.938859185643519e-05, "epoch": 3.10472972972973, "percentage": 77.62, "elapsed_time": "1:58:53", "remaining_time": "0:34:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 920, "total_steps": 1184, "loss": 0.1157, "learning_rate": 4.939646378909259e-05, "epoch": 3.108108108108108, "percentage": 77.7, "elapsed_time": "1:58:58", "remaining_time": "0:34:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 921, "total_steps": 1184, "loss": 0.1197, "learning_rate": 4.940432716994748e-05, "epoch": 3.1114864864864864, "percentage": 77.79, "elapsed_time": "1:59:03", "remaining_time": "0:33:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 922, "total_steps": 1184, "loss": 0.1202, "learning_rate": 4.9412182017560496e-05, "epoch": 3.114864864864865, "percentage": 77.87, "elapsed_time": "1:59:09", "remaining_time": "0:33:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 923, "total_steps": 1184, "loss": 0.1126, "learning_rate": 4.942002835043187e-05, "epoch": 3.1182432432432434, "percentage": 77.96, "elapsed_time": "1:59:14", "remaining_time": "0:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 924, "total_steps": 1184, "loss": 0.1111, "learning_rate": 4.942786618700178e-05, "epoch": 3.1216216216216215, "percentage": 78.04, "elapsed_time": "1:59:19", "remaining_time": "0:33:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 925, "total_steps": 1184, "loss": 0.1151, "learning_rate": 4.9435695545650545e-05, "epoch": 3.125, "percentage": 78.12, "elapsed_time": "1:59:24", "remaining_time": "0:33:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 926, "total_steps": 1184, "loss": 0.1106, "learning_rate": 4.944351644469891e-05, "epoch": 3.1283783783783785, "percentage": 78.21, "elapsed_time": "1:59:30", "remaining_time": "0:33:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 927, "total_steps": 1184, "loss": 0.1239, "learning_rate": 4.945132890240829e-05, "epoch": 3.1317567567567566, "percentage": 78.29, "elapsed_time": "1:59:35", "remaining_time": "0:33:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 928, "total_steps": 1184, "loss": 0.1252, "learning_rate": 4.945913293698104e-05, "epoch": 3.135135135135135, "percentage": 78.38, "elapsed_time": "1:59:40", "remaining_time": "0:33:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 929, "total_steps": 1184, "loss": 0.107, "learning_rate": 4.9466928566560696e-05, "epoch": 3.1385135135135136, "percentage": 78.46, "elapsed_time": "1:59:45", "remaining_time": "0:32:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 930, "total_steps": 1184, "loss": 0.113, "learning_rate": 4.9474715809232256e-05, "epoch": 3.141891891891892, "percentage": 78.55, "elapsed_time": "1:59:50", "remaining_time": "0:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 931, "total_steps": 1184, "loss": 0.1135, "learning_rate": 4.948249468302239e-05, "epoch": 3.14527027027027, "percentage": 78.63, "elapsed_time": "1:59:55", "remaining_time": "0:32:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 932, "total_steps": 1184, "loss": 0.1051, "learning_rate": 4.9490265205899697e-05, "epoch": 3.1486486486486487, "percentage": 78.72, "elapsed_time": "2:00:00", "remaining_time": "0:32:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 933, "total_steps": 1184, "loss": 0.121, "learning_rate": 4.9498027395775006e-05, "epoch": 3.152027027027027, "percentage": 78.8, "elapsed_time": "2:00:05", "remaining_time": "0:32:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 934, "total_steps": 1184, "loss": 0.1225, "learning_rate": 4.950578127050156e-05, "epoch": 3.1554054054054053, "percentage": 78.89, "elapsed_time": "2:00:11", "remaining_time": "0:32:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 935, "total_steps": 1184, "loss": 0.1294, "learning_rate": 4.95135268478753e-05, "epoch": 3.1587837837837838, "percentage": 78.97, "elapsed_time": "2:00:16", "remaining_time": "0:32:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 936, "total_steps": 1184, "loss": 0.1229, "learning_rate": 4.952126414563509e-05, "epoch": 3.1621621621621623, "percentage": 79.05, "elapsed_time": "2:00:21", "remaining_time": "0:31:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 937, "total_steps": 1184, "loss": 0.1117, "learning_rate": 4.952899318146297e-05, "epoch": 3.1655405405405403, "percentage": 79.14, "elapsed_time": "2:00:26", "remaining_time": "0:31:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 938, "total_steps": 1184, "loss": 0.0972, "learning_rate": 4.9536713972984414e-05, "epoch": 3.168918918918919, "percentage": 79.22, "elapsed_time": "2:00:31", "remaining_time": "0:31:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 939, "total_steps": 1184, "loss": 0.1333, "learning_rate": 4.954442653776852e-05, "epoch": 3.1722972972972974, "percentage": 79.31, "elapsed_time": "2:00:36", "remaining_time": "0:31:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 940, "total_steps": 1184, "loss": 0.1114, "learning_rate": 4.955213089332832e-05, "epoch": 3.175675675675676, "percentage": 79.39, "elapsed_time": "2:00:41", "remaining_time": "0:31:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 941, "total_steps": 1184, "loss": 0.1169, "learning_rate": 4.955982705712095e-05, "epoch": 3.179054054054054, "percentage": 79.48, "elapsed_time": "2:00:47", "remaining_time": "0:31:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 942, "total_steps": 1184, "loss": 0.1005, "learning_rate": 4.956751504654796e-05, "epoch": 3.1824324324324325, "percentage": 79.56, "elapsed_time": "2:00:52", "remaining_time": "0:31:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 943, "total_steps": 1184, "loss": 0.1187, "learning_rate": 4.957519487895548e-05, "epoch": 3.185810810810811, "percentage": 79.65, "elapsed_time": "2:00:57", "remaining_time": "0:30:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 944, "total_steps": 1184, "loss": 0.1273, "learning_rate": 4.9582866571634485e-05, "epoch": 3.189189189189189, "percentage": 79.73, "elapsed_time": "2:01:02", "remaining_time": "0:30:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 945, "total_steps": 1184, "loss": 0.1125, "learning_rate": 4.959053014182106e-05, "epoch": 3.1925675675675675, "percentage": 79.81, "elapsed_time": "2:01:07", "remaining_time": "0:30:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 946, "total_steps": 1184, "loss": 0.1175, "learning_rate": 4.959818560669655e-05, "epoch": 3.195945945945946, "percentage": 79.9, "elapsed_time": "2:01:12", "remaining_time": "0:30:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 947, "total_steps": 1184, "loss": 0.1131, "learning_rate": 4.96058329833879e-05, "epoch": 3.199324324324324, "percentage": 79.98, "elapsed_time": "2:01:17", "remaining_time": "0:30:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 948, "total_steps": 1184, "loss": 0.1262, "learning_rate": 4.961347228896777e-05, "epoch": 3.2027027027027026, "percentage": 80.07, "elapsed_time": "2:01:22", "remaining_time": "0:30:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 949, "total_steps": 1184, "loss": 0.1191, "learning_rate": 4.962110354045488e-05, "epoch": 3.206081081081081, "percentage": 80.15, "elapsed_time": "2:01:27", "remaining_time": "0:30:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 950, "total_steps": 1184, "loss": 0.1182, "learning_rate": 4.962872675481414e-05, "epoch": 3.2094594594594597, "percentage": 80.24, "elapsed_time": "2:01:33", "remaining_time": "0:29:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 951, "total_steps": 1184, "loss": 0.1211, "learning_rate": 4.9636341948956906e-05, "epoch": 3.2128378378378377, "percentage": 80.32, "elapsed_time": "2:01:38", "remaining_time": "0:29:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 952, "total_steps": 1184, "loss": 0.1195, "learning_rate": 4.964394913974124e-05, "epoch": 3.2162162162162162, "percentage": 80.41, "elapsed_time": "2:01:43", "remaining_time": "0:29:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 953, "total_steps": 1184, "loss": 0.1353, "learning_rate": 4.965154834397211e-05, "epoch": 3.2195945945945947, "percentage": 80.49, "elapsed_time": "2:01:48", "remaining_time": "0:29:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 954, "total_steps": 1184, "loss": 0.1111, "learning_rate": 4.965913957840159e-05, "epoch": 3.222972972972973, "percentage": 80.57, "elapsed_time": "2:01:53", "remaining_time": "0:29:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 955, "total_steps": 1184, "loss": 0.1256, "learning_rate": 4.966672285972911e-05, "epoch": 3.2263513513513513, "percentage": 80.66, "elapsed_time": "2:01:58", "remaining_time": "0:29:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 956, "total_steps": 1184, "loss": 0.1078, "learning_rate": 4.967429820460167e-05, "epoch": 3.22972972972973, "percentage": 80.74, "elapsed_time": "2:02:03", "remaining_time": "0:29:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 957, "total_steps": 1184, "loss": 0.1313, "learning_rate": 4.9681865629614064e-05, "epoch": 3.233108108108108, "percentage": 80.83, "elapsed_time": "2:02:08", "remaining_time": "0:28:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 958, "total_steps": 1184, "loss": 0.1396, "learning_rate": 4.9689425151309074e-05, "epoch": 3.2364864864864864, "percentage": 80.91, "elapsed_time": "2:02:14", "remaining_time": "0:28:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 959, "total_steps": 1184, "loss": 0.1242, "learning_rate": 4.969697678617773e-05, "epoch": 3.239864864864865, "percentage": 81.0, "elapsed_time": "2:02:19", "remaining_time": "0:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 960, "total_steps": 1184, "loss": 0.1149, "learning_rate": 4.970452055065948e-05, "epoch": 3.2432432432432434, "percentage": 81.08, "elapsed_time": "2:02:24", "remaining_time": "0:28:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 961, "total_steps": 1184, "loss": 0.1074, "learning_rate": 4.9712056461142423e-05, "epoch": 3.2466216216216215, "percentage": 81.17, "elapsed_time": "2:02:29", "remaining_time": "0:28:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 962, "total_steps": 1184, "loss": 0.1152, "learning_rate": 4.971958453396355e-05, "epoch": 3.25, "percentage": 81.25, "elapsed_time": "2:02:34", "remaining_time": "0:28:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 963, "total_steps": 1184, "loss": 0.1273, "learning_rate": 4.972710478540891e-05, "epoch": 3.2533783783783785, "percentage": 81.33, "elapsed_time": "2:02:39", "remaining_time": "0:28:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 964, "total_steps": 1184, "loss": 0.1149, "learning_rate": 4.973461723171385e-05, "epoch": 3.2567567567567566, "percentage": 81.42, "elapsed_time": "2:02:44", "remaining_time": "0:28:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 965, "total_steps": 1184, "loss": 0.1301, "learning_rate": 4.9742121889063213e-05, "epoch": 3.260135135135135, "percentage": 81.5, "elapsed_time": "2:02:49", "remaining_time": "0:27:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 966, "total_steps": 1184, "loss": 0.1133, "learning_rate": 4.974961877359156e-05, "epoch": 3.2635135135135136, "percentage": 81.59, "elapsed_time": "2:02:55", "remaining_time": "0:27:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 967, "total_steps": 1184, "loss": 0.1346, "learning_rate": 4.975710790138336e-05, "epoch": 3.266891891891892, "percentage": 81.67, "elapsed_time": "2:03:00", "remaining_time": "0:27:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 968, "total_steps": 1184, "loss": 0.3884, "learning_rate": 4.976458928847323e-05, "epoch": 3.27027027027027, "percentage": 81.76, "elapsed_time": "2:03:05", "remaining_time": "0:27:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 969, "total_steps": 1184, "loss": 0.1164, "learning_rate": 4.977206295084609e-05, "epoch": 3.2736486486486487, "percentage": 81.84, "elapsed_time": "2:03:10", "remaining_time": "0:27:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 970, "total_steps": 1184, "loss": 0.1269, "learning_rate": 4.9779528904437424e-05, "epoch": 3.277027027027027, "percentage": 81.93, "elapsed_time": "2:03:15", "remaining_time": "0:27:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 971, "total_steps": 1184, "loss": 0.1121, "learning_rate": 4.978698716513342e-05, "epoch": 3.2804054054054053, "percentage": 82.01, "elapsed_time": "2:03:20", "remaining_time": "0:27:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 972, "total_steps": 1184, "loss": 0.1219, "learning_rate": 4.9794437748771244e-05, "epoch": 3.2837837837837838, "percentage": 82.09, "elapsed_time": "2:03:25", "remaining_time": "0:26:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 973, "total_steps": 1184, "loss": 0.1303, "learning_rate": 4.9801880671139204e-05, "epoch": 3.2871621621621623, "percentage": 82.18, "elapsed_time": "2:03:30", "remaining_time": "0:26:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 974, "total_steps": 1184, "loss": 0.112, "learning_rate": 4.980931594797693e-05, "epoch": 3.2905405405405403, "percentage": 82.26, "elapsed_time": "2:03:36", "remaining_time": "0:26:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 975, "total_steps": 1184, "loss": 0.1326, "learning_rate": 4.981674359497562e-05, "epoch": 3.293918918918919, "percentage": 82.35, "elapsed_time": "2:03:41", "remaining_time": "0:26:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 976, "total_steps": 1184, "loss": 0.1244, "learning_rate": 4.98241636277782e-05, "epoch": 3.2972972972972974, "percentage": 82.43, "elapsed_time": "2:03:46", "remaining_time": "0:26:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 977, "total_steps": 1184, "loss": 0.1203, "learning_rate": 4.983157606197955e-05, "epoch": 3.3006756756756754, "percentage": 82.52, "elapsed_time": "2:03:51", "remaining_time": "0:26:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 978, "total_steps": 1184, "loss": 0.1247, "learning_rate": 4.98389809131267e-05, "epoch": 3.304054054054054, "percentage": 82.6, "elapsed_time": "2:03:56", "remaining_time": "0:26:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 979, "total_steps": 1184, "loss": 0.1321, "learning_rate": 4.984637819671897e-05, "epoch": 3.3074324324324325, "percentage": 82.69, "elapsed_time": "2:04:01", "remaining_time": "0:25:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 980, "total_steps": 1184, "loss": 0.1157, "learning_rate": 4.985376792820825e-05, "epoch": 3.310810810810811, "percentage": 82.77, "elapsed_time": "2:04:06", "remaining_time": "0:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 981, "total_steps": 1184, "loss": 0.1103, "learning_rate": 4.986115012299915e-05, "epoch": 3.314189189189189, "percentage": 82.85, "elapsed_time": "2:04:11", "remaining_time": "0:25:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 982, "total_steps": 1184, "loss": 0.1284, "learning_rate": 4.986852479644916e-05, "epoch": 3.3175675675675675, "percentage": 82.94, "elapsed_time": "2:04:16", "remaining_time": "0:25:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 983, "total_steps": 1184, "loss": 0.1126, "learning_rate": 4.987589196386893e-05, "epoch": 3.320945945945946, "percentage": 83.02, "elapsed_time": "2:04:22", "remaining_time": "0:25:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 984, "total_steps": 1184, "loss": 0.1199, "learning_rate": 4.988325164052236e-05, "epoch": 3.3243243243243246, "percentage": 83.11, "elapsed_time": "2:04:27", "remaining_time": "0:25:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 985, "total_steps": 1184, "loss": 0.1295, "learning_rate": 4.9890603841626866e-05, "epoch": 3.3277027027027026, "percentage": 83.19, "elapsed_time": "2:04:32", "remaining_time": "0:25:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 986, "total_steps": 1184, "loss": 0.1276, "learning_rate": 4.989794858235352e-05, "epoch": 3.331081081081081, "percentage": 83.28, "elapsed_time": "2:04:37", "remaining_time": "0:25:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 987, "total_steps": 1184, "loss": 0.1355, "learning_rate": 4.990528587782729e-05, "epoch": 3.3344594594594597, "percentage": 83.36, "elapsed_time": "2:04:42", "remaining_time": "0:24:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 988, "total_steps": 1184, "loss": 0.1159, "learning_rate": 4.9912615743127146e-05, "epoch": 3.3378378378378377, "percentage": 83.45, "elapsed_time": "2:04:47", "remaining_time": "0:24:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 989, "total_steps": 1184, "loss": 0.1349, "learning_rate": 4.991993819328633e-05, "epoch": 3.3412162162162162, "percentage": 83.53, "elapsed_time": "2:04:52", "remaining_time": "0:24:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 990, "total_steps": 1184, "loss": 0.123, "learning_rate": 4.9927253243292505e-05, "epoch": 3.3445945945945947, "percentage": 83.61, "elapsed_time": "2:04:57", "remaining_time": "0:24:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 991, "total_steps": 1184, "loss": 0.1212, "learning_rate": 4.993456090808793e-05, "epoch": 3.347972972972973, "percentage": 83.7, "elapsed_time": "2:05:03", "remaining_time": "0:24:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 992, "total_steps": 1184, "loss": 0.1204, "learning_rate": 4.994186120256965e-05, "epoch": 3.3513513513513513, "percentage": 83.78, "elapsed_time": "2:05:08", "remaining_time": "0:24:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 993, "total_steps": 1184, "loss": 0.1175, "learning_rate": 4.9949154141589696e-05, "epoch": 3.35472972972973, "percentage": 83.87, "elapsed_time": "2:05:13", "remaining_time": "0:24:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 994, "total_steps": 1184, "loss": 0.1198, "learning_rate": 4.995643973995523e-05, "epoch": 3.358108108108108, "percentage": 83.95, "elapsed_time": "2:05:18", "remaining_time": "0:23:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 995, "total_steps": 1184, "loss": 0.1348, "learning_rate": 4.9963718012428765e-05, "epoch": 3.3614864864864864, "percentage": 84.04, "elapsed_time": "2:05:23", "remaining_time": "0:23:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 996, "total_steps": 1184, "loss": 0.1104, "learning_rate": 4.9970988973728314e-05, "epoch": 3.364864864864865, "percentage": 84.12, "elapsed_time": "2:05:28", "remaining_time": "0:23:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 997, "total_steps": 1184, "loss": 0.3864, "learning_rate": 4.99782526385276e-05, "epoch": 3.3682432432432434, "percentage": 84.21, "elapsed_time": "2:05:33", "remaining_time": "0:23:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 998, "total_steps": 1184, "loss": 0.1383, "learning_rate": 4.998550902145619e-05, "epoch": 3.3716216216216215, "percentage": 84.29, "elapsed_time": "2:05:38", "remaining_time": "0:23:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 999, "total_steps": 1184, "loss": 0.1318, "learning_rate": 4.999275813709971e-05, "epoch": 3.375, "percentage": 84.38, "elapsed_time": "2:05:44", "remaining_time": "0:23:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 1184, "loss": 0.1285, "learning_rate": 5e-05, "epoch": 3.3783783783783785, "percentage": 84.46, "elapsed_time": "2:05:49", "remaining_time": "0:23:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1001, "total_steps": 1184, "loss": 0.1125, "learning_rate": 4.9996356488619556e-05, "epoch": 3.3817567567567566, "percentage": 84.54, "elapsed_time": "2:19:33", "remaining_time": "0:25:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1002, "total_steps": 1184, "loss": 0.1221, "learning_rate": 4.9985427016598435e-05, "epoch": 3.385135135135135, "percentage": 84.63, "elapsed_time": "2:19:39", "remaining_time": "0:25:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1003, "total_steps": 1184, "loss": 0.1215, "learning_rate": 4.996721476998771e-05, "epoch": 3.3885135135135136, "percentage": 84.71, "elapsed_time": "2:19:44", "remaining_time": "0:25:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1004, "total_steps": 1184, "loss": 0.1233, "learning_rate": 4.9941725057840504e-05, "epoch": 3.391891891891892, "percentage": 84.8, "elapsed_time": "2:19:49", "remaining_time": "0:25:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1005, "total_steps": 1184, "loss": 0.1149, "learning_rate": 4.9908965310664374e-05, "epoch": 3.39527027027027, "percentage": 84.88, "elapsed_time": "2:19:54", "remaining_time": "0:24:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1006, "total_steps": 1184, "loss": 0.1358, "learning_rate": 4.986894507825522e-05, "epoch": 3.3986486486486487, "percentage": 84.97, "elapsed_time": "2:19:59", "remaining_time": "0:24:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1007, "total_steps": 1184, "loss": 0.132, "learning_rate": 4.9821676026913475e-05, "epoch": 3.402027027027027, "percentage": 85.05, "elapsed_time": "2:20:04", "remaining_time": "0:24:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1008, "total_steps": 1184, "loss": 0.1169, "learning_rate": 4.9767171936043175e-05, "epoch": 3.4054054054054053, "percentage": 85.14, "elapsed_time": "2:20:09", "remaining_time": "0:24:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1009, "total_steps": 1184, "loss": 0.1197, "learning_rate": 4.970544869413522e-05, "epoch": 3.4087837837837838, "percentage": 85.22, "elapsed_time": "2:20:14", "remaining_time": "0:24:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1010, "total_steps": 1184, "loss": 0.1315, "learning_rate": 4.963652429413563e-05, "epoch": 3.4121621621621623, "percentage": 85.3, "elapsed_time": "2:20:19", "remaining_time": "0:24:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1011, "total_steps": 1184, "loss": 0.1187, "learning_rate": 4.9560418828200494e-05, "epoch": 3.4155405405405403, "percentage": 85.39, "elapsed_time": "2:20:24", "remaining_time": "0:24:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1012, "total_steps": 1184, "loss": 0.1353, "learning_rate": 4.9477154481838875e-05, "epoch": 3.418918918918919, "percentage": 85.47, "elapsed_time": "2:20:29", "remaining_time": "0:23:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1013, "total_steps": 1184, "loss": 0.1459, "learning_rate": 4.9386755527445475e-05, "epoch": 3.4222972972972974, "percentage": 85.56, "elapsed_time": "2:20:35", "remaining_time": "0:23:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1014, "total_steps": 1184, "loss": 0.1292, "learning_rate": 4.928924831722504e-05, "epoch": 3.4256756756756754, "percentage": 85.64, "elapsed_time": "2:20:40", "remaining_time": "0:23:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1015, "total_steps": 1184, "loss": 0.1153, "learning_rate": 4.9184661275510446e-05, "epoch": 3.429054054054054, "percentage": 85.73, "elapsed_time": "2:20:45", "remaining_time": "0:23:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1016, "total_steps": 1184, "loss": 0.1179, "learning_rate": 4.907302489047662e-05, "epoch": 3.4324324324324325, "percentage": 85.81, "elapsed_time": "2:20:50", "remaining_time": "0:23:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1017, "total_steps": 1184, "loss": 0.1302, "learning_rate": 4.895437170525303e-05, "epoch": 3.435810810810811, "percentage": 85.9, "elapsed_time": "2:20:55", "remaining_time": "0:23:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1018, "total_steps": 1184, "loss": 0.1302, "learning_rate": 4.882873630843699e-05, "epoch": 3.439189189189189, "percentage": 85.98, "elapsed_time": "2:21:00", "remaining_time": "0:22:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1019, "total_steps": 1184, "loss": 0.1327, "learning_rate": 4.869615532401074e-05, "epoch": 3.4425675675675675, "percentage": 86.06, "elapsed_time": "2:21:05", "remaining_time": "0:22:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1020, "total_steps": 1184, "loss": 0.129, "learning_rate": 4.855666740066522e-05, "epoch": 3.445945945945946, "percentage": 86.15, "elapsed_time": "2:21:10", "remaining_time": "0:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1021, "total_steps": 1184, "loss": 0.1243, "learning_rate": 4.841031320053351e-05, "epoch": 3.4493243243243246, "percentage": 86.23, "elapsed_time": "2:21:15", "remaining_time": "0:22:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1022, "total_steps": 1184, "loss": 0.1321, "learning_rate": 4.825713538733748e-05, "epoch": 3.4527027027027026, "percentage": 86.32, "elapsed_time": "2:21:21", "remaining_time": "0:22:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1023, "total_steps": 1184, "loss": 0.186, "learning_rate": 4.80971786139509e-05, "epoch": 3.456081081081081, "percentage": 86.4, "elapsed_time": "2:21:26", "remaining_time": "0:22:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1024, "total_steps": 1184, "loss": 0.6012, "learning_rate": 4.793048950938256e-05, "epoch": 3.4594594594594597, "percentage": 86.49, "elapsed_time": "2:21:31", "remaining_time": "0:22:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1025, "total_steps": 1184, "loss": 0.373, "learning_rate": 4.7757116665183614e-05, "epoch": 3.4628378378378377, "percentage": 86.57, "elapsed_time": "2:21:36", "remaining_time": "0:21:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1026, "total_steps": 1184, "loss": 0.6334, "learning_rate": 4.757711062128251e-05, "epoch": 3.4662162162162162, "percentage": 86.66, "elapsed_time": "2:21:41", "remaining_time": "0:21:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1027, "total_steps": 1184, "loss": 0.6214, "learning_rate": 4.739052385125216e-05, "epoch": 3.4695945945945947, "percentage": 86.74, "elapsed_time": "2:21:46", "remaining_time": "0:21:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1028, "total_steps": 1184, "loss": 0.308, "learning_rate": 4.7197410747013376e-05, "epoch": 3.472972972972973, "percentage": 86.82, "elapsed_time": "2:21:51", "remaining_time": "0:21:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1029, "total_steps": 1184, "loss": 0.3552, "learning_rate": 4.6997827602979024e-05, "epoch": 3.4763513513513513, "percentage": 86.91, "elapsed_time": "2:21:56", "remaining_time": "0:21:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1030, "total_steps": 1184, "loss": 0.3405, "learning_rate": 4.67918325996437e-05, "epoch": 3.47972972972973, "percentage": 86.99, "elapsed_time": "2:22:01", "remaining_time": "0:21:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1031, "total_steps": 1184, "loss": 0.4361, "learning_rate": 4.6579485786623475e-05, "epoch": 3.483108108108108, "percentage": 87.08, "elapsed_time": "2:22:07", "remaining_time": "0:21:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1032, "total_steps": 1184, "loss": 0.1359, "learning_rate": 4.636084906515085e-05, "epoch": 3.4864864864864864, "percentage": 87.16, "elapsed_time": "2:22:12", "remaining_time": "0:20:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1033, "total_steps": 1184, "loss": 0.5506, "learning_rate": 4.6135986170029947e-05, "epoch": 3.489864864864865, "percentage": 87.25, "elapsed_time": "2:22:17", "remaining_time": "0:20:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1034, "total_steps": 1184, "loss": 0.1839, "learning_rate": 4.5904962651057134e-05, "epoch": 3.4932432432432434, "percentage": 87.33, "elapsed_time": "2:22:22", "remaining_time": "0:20:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1035, "total_steps": 1184, "loss": 0.1534, "learning_rate": 4.566784585391263e-05, "epoch": 3.4966216216216215, "percentage": 87.42, "elapsed_time": "2:22:27", "remaining_time": "0:20:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1036, "total_steps": 1184, "loss": 0.1429, "learning_rate": 4.542470490052853e-05, "epoch": 3.5, "percentage": 87.5, "elapsed_time": "2:22:32", "remaining_time": "0:20:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1037, "total_steps": 1184, "loss": 0.1351, "learning_rate": 4.517561066893909e-05, "epoch": 3.5033783783783785, "percentage": 87.58, "elapsed_time": "2:22:37", "remaining_time": "0:20:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1038, "total_steps": 1184, "loss": 0.1312, "learning_rate": 4.492063577261908e-05, "epoch": 3.506756756756757, "percentage": 87.67, "elapsed_time": "2:22:42", "remaining_time": "0:20:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1039, "total_steps": 1184, "loss": 0.1418, "learning_rate": 4.4659854539316174e-05, "epoch": 3.510135135135135, "percentage": 87.75, "elapsed_time": "2:22:47", "remaining_time": "0:19:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1040, "total_steps": 1184, "loss": 0.1465, "learning_rate": 4.439334298938374e-05, "epoch": 3.5135135135135136, "percentage": 87.84, "elapsed_time": "2:22:53", "remaining_time": "0:19:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1041, "total_steps": 1184, "loss": 0.1481, "learning_rate": 4.4121178813620046e-05, "epoch": 3.516891891891892, "percentage": 87.92, "elapsed_time": "2:22:58", "remaining_time": "0:19:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1042, "total_steps": 1184, "loss": 0.1219, "learning_rate": 4.384344135062071e-05, "epoch": 3.52027027027027, "percentage": 88.01, "elapsed_time": "2:23:03", "remaining_time": "0:19:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1043, "total_steps": 1184, "loss": 0.1282, "learning_rate": 4.3560211563650635e-05, "epoch": 3.5236486486486487, "percentage": 88.09, "elapsed_time": "2:23:08", "remaining_time": "0:19:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1044, "total_steps": 1184, "loss": 0.133, "learning_rate": 4.327157201704241e-05, "epoch": 3.527027027027027, "percentage": 88.18, "elapsed_time": "2:23:13", "remaining_time": "0:19:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1045, "total_steps": 1184, "loss": 0.1268, "learning_rate": 4.297760685212801e-05, "epoch": 3.5304054054054053, "percentage": 88.26, "elapsed_time": "2:23:18", "remaining_time": "0:19:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1046, "total_steps": 1184, "loss": 0.1304, "learning_rate": 4.2678401762710726e-05, "epoch": 3.5337837837837838, "percentage": 88.34, "elapsed_time": "2:23:23", "remaining_time": "0:18:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1047, "total_steps": 1184, "loss": 0.134, "learning_rate": 4.237404397008455e-05, "epoch": 3.5371621621621623, "percentage": 88.43, "elapsed_time": "2:23:28", "remaining_time": "0:18:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1048, "total_steps": 1184, "loss": 0.1106, "learning_rate": 4.206462219760831e-05, "epoch": 3.5405405405405403, "percentage": 88.51, "elapsed_time": "2:23:34", "remaining_time": "0:18:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1049, "total_steps": 1184, "loss": 0.1268, "learning_rate": 4.175022664484191e-05, "epoch": 3.543918918918919, "percentage": 88.6, "elapsed_time": "2:23:39", "remaining_time": "0:18:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1050, "total_steps": 1184, "loss": 0.134, "learning_rate": 4.143094896125227e-05, "epoch": 3.5472972972972974, "percentage": 88.68, "elapsed_time": "2:23:44", "remaining_time": "0:18:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1051, "total_steps": 1184, "loss": 0.1185, "learning_rate": 4.1106882219496535e-05, "epoch": 3.5506756756756754, "percentage": 88.77, "elapsed_time": "2:23:49", "remaining_time": "0:18:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1052, "total_steps": 1184, "loss": 0.1251, "learning_rate": 4.077812088829051e-05, "epoch": 3.554054054054054, "percentage": 88.85, "elapsed_time": "2:23:54", "remaining_time": "0:18:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1053, "total_steps": 1184, "loss": 0.1405, "learning_rate": 4.044476080487005e-05, "epoch": 3.5574324324324325, "percentage": 88.94, "elapsed_time": "2:23:59", "remaining_time": "0:17:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1054, "total_steps": 1184, "loss": 0.1162, "learning_rate": 4.0106899147053564e-05, "epoch": 3.560810810810811, "percentage": 89.02, "elapsed_time": "2:24:04", "remaining_time": "0:17:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1055, "total_steps": 1184, "loss": 0.123, "learning_rate": 3.976463440491367e-05, "epoch": 3.564189189189189, "percentage": 89.1, "elapsed_time": "2:24:10", "remaining_time": "0:17:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1056, "total_steps": 1184, "loss": 0.1276, "learning_rate": 3.941806635206639e-05, "epoch": 3.5675675675675675, "percentage": 89.19, "elapsed_time": "2:24:15", "remaining_time": "0:17:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1057, "total_steps": 1184, "loss": 0.1336, "learning_rate": 3.9067296016586105e-05, "epoch": 3.570945945945946, "percentage": 89.27, "elapsed_time": "2:24:20", "remaining_time": "0:17:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1058, "total_steps": 1184, "loss": 0.1267, "learning_rate": 3.871242565155485e-05, "epoch": 3.5743243243243246, "percentage": 89.36, "elapsed_time": "2:24:25", "remaining_time": "0:17:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1059, "total_steps": 1184, "loss": 0.4067, "learning_rate": 3.835355870525455e-05, "epoch": 3.5777027027027026, "percentage": 89.44, "elapsed_time": "2:24:30", "remaining_time": "0:17:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1060, "total_steps": 1184, "loss": 0.1231, "learning_rate": 3.799079979101075e-05, "epoch": 3.581081081081081, "percentage": 89.53, "elapsed_time": "2:24:35", "remaining_time": "0:16:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1061, "total_steps": 1184, "loss": 0.1405, "learning_rate": 3.7624254656696864e-05, "epoch": 3.5844594594594597, "percentage": 89.61, "elapsed_time": "2:24:40", "remaining_time": "0:16:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1062, "total_steps": 1184, "loss": 0.118, "learning_rate": 3.7254030153907494e-05, "epoch": 3.5878378378378377, "percentage": 89.7, "elapsed_time": "2:24:45", "remaining_time": "0:16:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1063, "total_steps": 1184, "loss": 0.127, "learning_rate": 3.688023420681019e-05, "epoch": 3.5912162162162162, "percentage": 89.78, "elapsed_time": "2:24:51", "remaining_time": "0:16:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1064, "total_steps": 1184, "loss": 0.1238, "learning_rate": 3.650297578068448e-05, "epoch": 3.5945945945945947, "percentage": 89.86, "elapsed_time": "2:24:56", "remaining_time": "0:16:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1065, "total_steps": 1184, "loss": 0.1342, "learning_rate": 3.6122364850157326e-05, "epoch": 3.597972972972973, "percentage": 89.95, "elapsed_time": "2:25:01", "remaining_time": "0:16:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1066, "total_steps": 1184, "loss": 0.1108, "learning_rate": 3.573851236714447e-05, "epoch": 3.6013513513513513, "percentage": 90.03, "elapsed_time": "2:25:06", "remaining_time": "0:16:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1067, "total_steps": 1184, "loss": 0.1279, "learning_rate": 3.535153022850684e-05, "epoch": 3.60472972972973, "percentage": 90.12, "elapsed_time": "2:25:11", "remaining_time": "0:15:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1068, "total_steps": 1184, "loss": 0.1263, "learning_rate": 3.496153124343142e-05, "epoch": 3.608108108108108, "percentage": 90.2, "elapsed_time": "2:25:16", "remaining_time": "0:15:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1069, "total_steps": 1184, "loss": 0.1185, "learning_rate": 3.4568629100546333e-05, "epoch": 3.6114864864864864, "percentage": 90.29, "elapsed_time": "2:25:21", "remaining_time": "0:15:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1070, "total_steps": 1184, "loss": 0.1222, "learning_rate": 3.417293833477938e-05, "epoch": 3.614864864864865, "percentage": 90.37, "elapsed_time": "2:25:26", "remaining_time": "0:15:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1071, "total_steps": 1184, "loss": 0.1196, "learning_rate": 3.377457429397001e-05, "epoch": 3.618243243243243, "percentage": 90.46, "elapsed_time": "2:25:32", "remaining_time": "0:15:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1072, "total_steps": 1184, "loss": 0.1291, "learning_rate": 3.337365310524423e-05, "epoch": 3.6216216216216215, "percentage": 90.54, "elapsed_time": "2:25:37", "remaining_time": "0:15:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1073, "total_steps": 1184, "loss": 0.1267, "learning_rate": 3.2970291641162396e-05, "epoch": 3.625, "percentage": 90.62, "elapsed_time": "2:25:42", "remaining_time": "0:15:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1074, "total_steps": 1184, "loss": 0.1207, "learning_rate": 3.25646074856497e-05, "epoch": 3.6283783783783785, "percentage": 90.71, "elapsed_time": "2:25:47", "remaining_time": "0:14:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1075, "total_steps": 1184, "loss": 0.372, "learning_rate": 3.2156718899719216e-05, "epoch": 3.631756756756757, "percentage": 90.79, "elapsed_time": "2:25:52", "remaining_time": "0:14:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1076, "total_steps": 1184, "loss": 0.1273, "learning_rate": 3.174674478699772e-05, "epoch": 3.635135135135135, "percentage": 90.88, "elapsed_time": "2:25:57", "remaining_time": "0:14:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1077, "total_steps": 1184, "loss": 0.1256, "learning_rate": 3.133480465906398e-05, "epoch": 3.6385135135135136, "percentage": 90.96, "elapsed_time": "2:26:02", "remaining_time": "0:14:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1078, "total_steps": 1184, "loss": 0.1334, "learning_rate": 3.092101860061e-05, "epoch": 3.641891891891892, "percentage": 91.05, "elapsed_time": "2:26:08", "remaining_time": "0:14:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1079, "total_steps": 1184, "loss": 0.111, "learning_rate": 3.0505507234435122e-05, "epoch": 3.64527027027027, "percentage": 91.13, "elapsed_time": "2:26:13", "remaining_time": "0:14:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1080, "total_steps": 1184, "loss": 0.1348, "learning_rate": 3.0088391686283214e-05, "epoch": 3.6486486486486487, "percentage": 91.22, "elapsed_time": "2:26:18", "remaining_time": "0:14:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1081, "total_steps": 1184, "loss": 0.1262, "learning_rate": 2.966979354953336e-05, "epoch": 3.652027027027027, "percentage": 91.3, "elapsed_time": "2:26:23", "remaining_time": "0:13:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1082, "total_steps": 1184, "loss": 0.1185, "learning_rate": 2.92498348497541e-05, "epoch": 3.6554054054054053, "percentage": 91.39, "elapsed_time": "2:26:28", "remaining_time": "0:13:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1083, "total_steps": 1184, "loss": 0.1248, "learning_rate": 2.882863800913182e-05, "epoch": 3.6587837837837838, "percentage": 91.47, "elapsed_time": "2:26:33", "remaining_time": "0:13:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1084, "total_steps": 1184, "loss": 0.1282, "learning_rate": 2.8406325810783425e-05, "epoch": 3.6621621621621623, "percentage": 91.55, "elapsed_time": "2:26:38", "remaining_time": "0:13:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1085, "total_steps": 1184, "loss": 0.1098, "learning_rate": 2.798302136296379e-05, "epoch": 3.6655405405405403, "percentage": 91.64, "elapsed_time": "2:26:43", "remaining_time": "0:13:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1086, "total_steps": 1184, "loss": 0.1129, "learning_rate": 2.7558848063178506e-05, "epoch": 3.668918918918919, "percentage": 91.72, "elapsed_time": "2:26:49", "remaining_time": "0:13:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1087, "total_steps": 1184, "loss": 0.1187, "learning_rate": 2.713392956221225e-05, "epoch": 3.6722972972972974, "percentage": 91.81, "elapsed_time": "2:26:54", "remaining_time": "0:13:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1088, "total_steps": 1184, "loss": 0.1311, "learning_rate": 2.6708389728083372e-05, "epoch": 3.6756756756756754, "percentage": 91.89, "elapsed_time": "2:26:59", "remaining_time": "0:12:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1089, "total_steps": 1184, "loss": 0.1294, "learning_rate": 2.6282352609935028e-05, "epoch": 3.679054054054054, "percentage": 91.98, "elapsed_time": "2:27:04", "remaining_time": "0:12:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1090, "total_steps": 1184, "loss": 0.128, "learning_rate": 2.5855942401873734e-05, "epoch": 3.6824324324324325, "percentage": 92.06, "elapsed_time": "2:27:09", "remaining_time": "0:12:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1091, "total_steps": 1184, "loss": 0.1373, "learning_rate": 2.5429283406765436e-05, "epoch": 3.685810810810811, "percentage": 92.15, "elapsed_time": "2:27:14", "remaining_time": "0:12:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1092, "total_steps": 1184, "loss": 0.115, "learning_rate": 2.50025e-05, "epoch": 3.689189189189189, "percentage": 92.23, "elapsed_time": "2:27:19", "remaining_time": "0:12:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1093, "total_steps": 1184, "loss": 0.105, "learning_rate": 2.4575716593234574e-05, "epoch": 3.6925675675675675, "percentage": 92.31, "elapsed_time": "2:27:24", "remaining_time": "0:12:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1094, "total_steps": 1184, "loss": 0.1215, "learning_rate": 2.414905759812627e-05, "epoch": 3.695945945945946, "percentage": 92.4, "elapsed_time": "2:27:30", "remaining_time": "0:12:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1095, "total_steps": 1184, "loss": 0.1121, "learning_rate": 2.372264739006497e-05, "epoch": 3.6993243243243246, "percentage": 92.48, "elapsed_time": "2:27:35", "remaining_time": "0:11:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1096, "total_steps": 1184, "loss": 0.1142, "learning_rate": 2.329661027191664e-05, "epoch": 3.7027027027027026, "percentage": 92.57, "elapsed_time": "2:27:40", "remaining_time": "0:11:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1097, "total_steps": 1184, "loss": 0.1132, "learning_rate": 2.287107043778775e-05, "epoch": 3.706081081081081, "percentage": 92.65, "elapsed_time": "2:27:45", "remaining_time": "0:11:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1098, "total_steps": 1184, "loss": 0.1129, "learning_rate": 2.2446151936821504e-05, "epoch": 3.7094594594594597, "percentage": 92.74, "elapsed_time": "2:27:50", "remaining_time": "0:11:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1099, "total_steps": 1184, "loss": 0.1268, "learning_rate": 2.2021978637036214e-05, "epoch": 3.7128378378378377, "percentage": 92.82, "elapsed_time": "2:27:55", "remaining_time": "0:11:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1100, "total_steps": 1184, "loss": 0.1285, "learning_rate": 2.1598674189216575e-05, "epoch": 3.7162162162162162, "percentage": 92.91, "elapsed_time": "2:28:00", "remaining_time": "0:11:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1101, "total_steps": 1184, "loss": 0.116, "learning_rate": 2.117636199086818e-05, "epoch": 3.7195945945945947, "percentage": 92.99, "elapsed_time": "2:28:05", "remaining_time": "0:11:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1102, "total_steps": 1184, "loss": 0.1137, "learning_rate": 2.0755165150245906e-05, "epoch": 3.722972972972973, "percentage": 93.07, "elapsed_time": "2:28:11", "remaining_time": "0:11:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1103, "total_steps": 1184, "loss": 0.1153, "learning_rate": 2.0335206450466658e-05, "epoch": 3.7263513513513513, "percentage": 93.16, "elapsed_time": "2:28:16", "remaining_time": "0:10:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1104, "total_steps": 1184, "loss": 0.1131, "learning_rate": 1.9916608313716786e-05, "epoch": 3.72972972972973, "percentage": 93.24, "elapsed_time": "2:28:21", "remaining_time": "0:10:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1105, "total_steps": 1184, "loss": 0.1123, "learning_rate": 1.9499492765564878e-05, "epoch": 3.733108108108108, "percentage": 93.33, "elapsed_time": "2:28:26", "remaining_time": "0:10:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1106, "total_steps": 1184, "loss": 0.1156, "learning_rate": 1.9083981399389997e-05, "epoch": 3.7364864864864864, "percentage": 93.41, "elapsed_time": "2:28:31", "remaining_time": "0:10:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1107, "total_steps": 1184, "loss": 0.1164, "learning_rate": 1.8670195340936026e-05, "epoch": 3.739864864864865, "percentage": 93.5, "elapsed_time": "2:28:36", "remaining_time": "0:10:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1108, "total_steps": 1184, "loss": 0.1077, "learning_rate": 1.825825521300229e-05, "epoch": 3.743243243243243, "percentage": 93.58, "elapsed_time": "2:28:41", "remaining_time": "0:10:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1109, "total_steps": 1184, "loss": 0.1053, "learning_rate": 1.7848281100280788e-05, "epoch": 3.7466216216216215, "percentage": 93.67, "elapsed_time": "2:28:46", "remaining_time": "0:10:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1110, "total_steps": 1184, "loss": 0.1226, "learning_rate": 1.7440392514350303e-05, "epoch": 3.75, "percentage": 93.75, "elapsed_time": "2:28:52", "remaining_time": "0:09:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1111, "total_steps": 1184, "loss": 0.0983, "learning_rate": 1.7034708358837607e-05, "epoch": 3.7533783783783785, "percentage": 93.83, "elapsed_time": "2:28:57", "remaining_time": "0:09:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1112, "total_steps": 1184, "loss": 0.1274, "learning_rate": 1.6631346894755773e-05, "epoch": 3.756756756756757, "percentage": 93.92, "elapsed_time": "2:29:02", "remaining_time": "0:09:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1113, "total_steps": 1184, "loss": 0.1203, "learning_rate": 1.6230425706029996e-05, "epoch": 3.760135135135135, "percentage": 94.0, "elapsed_time": "2:29:07", "remaining_time": "0:09:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1114, "total_steps": 1184, "loss": 0.1122, "learning_rate": 1.5832061665220622e-05, "epoch": 3.7635135135135136, "percentage": 94.09, "elapsed_time": "2:29:12", "remaining_time": "0:09:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1115, "total_steps": 1184, "loss": 0.1139, "learning_rate": 1.5436370899453666e-05, "epoch": 3.766891891891892, "percentage": 94.17, "elapsed_time": "2:29:17", "remaining_time": "0:09:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1116, "total_steps": 1184, "loss": 0.1195, "learning_rate": 1.504346875656858e-05, "epoch": 3.77027027027027, "percentage": 94.26, "elapsed_time": "2:29:22", "remaining_time": "0:09:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1117, "total_steps": 1184, "loss": 0.1018, "learning_rate": 1.4653469771493166e-05, "epoch": 3.7736486486486487, "percentage": 94.34, "elapsed_time": "2:29:27", "remaining_time": "0:08:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1118, "total_steps": 1184, "loss": 0.1044, "learning_rate": 1.426648763285553e-05, "epoch": 3.777027027027027, "percentage": 94.43, "elapsed_time": "2:29:33", "remaining_time": "0:08:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1119, "total_steps": 1184, "loss": 0.0976, "learning_rate": 1.3882635149842685e-05, "epoch": 3.7804054054054053, "percentage": 94.51, "elapsed_time": "2:29:38", "remaining_time": "0:08:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1120, "total_steps": 1184, "loss": 0.1159, "learning_rate": 1.3502024219315524e-05, "epoch": 3.7837837837837838, "percentage": 94.59, "elapsed_time": "2:29:43", "remaining_time": "0:08:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1121, "total_steps": 1184, "loss": 0.108, "learning_rate": 1.3124765793189808e-05, "epoch": 3.7871621621621623, "percentage": 94.68, "elapsed_time": "2:29:48", "remaining_time": "0:08:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1122, "total_steps": 1184, "loss": 0.1011, "learning_rate": 1.2750969846092514e-05, "epoch": 3.7905405405405403, "percentage": 94.76, "elapsed_time": "2:29:53", "remaining_time": "0:08:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1123, "total_steps": 1184, "loss": 0.115, "learning_rate": 1.2380745343303146e-05, "epoch": 3.793918918918919, "percentage": 94.85, "elapsed_time": "2:29:58", "remaining_time": "0:08:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1124, "total_steps": 1184, "loss": 0.1136, "learning_rate": 1.2014200208989255e-05, "epoch": 3.7972972972972974, "percentage": 94.93, "elapsed_time": "2:30:03", "remaining_time": "0:08:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1125, "total_steps": 1184, "loss": 0.1172, "learning_rate": 1.165144129474546e-05, "epoch": 3.8006756756756754, "percentage": 95.02, "elapsed_time": "2:30:09", "remaining_time": "0:07:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1126, "total_steps": 1184, "loss": 0.1107, "learning_rate": 1.1292574348445151e-05, "epoch": 3.804054054054054, "percentage": 95.1, "elapsed_time": "2:30:14", "remaining_time": "0:07:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1127, "total_steps": 1184, "loss": 0.0962, "learning_rate": 1.0937703983413898e-05, "epoch": 3.8074324324324325, "percentage": 95.19, "elapsed_time": "2:30:19", "remaining_time": "0:07:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1128, "total_steps": 1184, "loss": 0.1168, "learning_rate": 1.058693364793361e-05, "epoch": 3.810810810810811, "percentage": 95.27, "elapsed_time": "2:30:24", "remaining_time": "0:07:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1129, "total_steps": 1184, "loss": 0.1167, "learning_rate": 1.0240365595086335e-05, "epoch": 3.814189189189189, "percentage": 95.35, "elapsed_time": "2:30:29", "remaining_time": "0:07:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1130, "total_steps": 1184, "loss": 0.1209, "learning_rate": 9.898100852946441e-06, "epoch": 3.8175675675675675, "percentage": 95.44, "elapsed_time": "2:30:34", "remaining_time": "0:07:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1131, "total_steps": 1184, "loss": 0.1062, "learning_rate": 9.560239195129949e-06, "epoch": 3.820945945945946, "percentage": 95.52, "elapsed_time": "2:30:39", "remaining_time": "0:07:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1132, "total_steps": 1184, "loss": 0.1091, "learning_rate": 9.226879111709494e-06, "epoch": 3.8243243243243246, "percentage": 95.61, "elapsed_time": "2:30:44", "remaining_time": "0:06:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1133, "total_steps": 1184, "loss": 0.1029, "learning_rate": 8.898117780503471e-06, "epoch": 3.8277027027027026, "percentage": 95.69, "elapsed_time": "2:30:50", "remaining_time": "0:06:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1134, "total_steps": 1184, "loss": 0.1121, "learning_rate": 8.574051038747738e-06, "epoch": 3.831081081081081, "percentage": 95.78, "elapsed_time": "2:30:55", "remaining_time": "0:06:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1135, "total_steps": 1184, "loss": 0.1007, "learning_rate": 8.254773355158088e-06, "epoch": 3.8344594594594597, "percentage": 95.86, "elapsed_time": "2:31:00", "remaining_time": "0:06:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1136, "total_steps": 1184, "loss": 0.1146, "learning_rate": 7.94037780239169e-06, "epoch": 3.8378378378378377, "percentage": 95.95, "elapsed_time": "2:31:05", "remaining_time": "0:06:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1137, "total_steps": 1184, "loss": 0.1016, "learning_rate": 7.630956029915455e-06, "epoch": 3.8412162162162162, "percentage": 96.03, "elapsed_time": "2:31:10", "remaining_time": "0:06:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1138, "total_steps": 1184, "loss": 0.0989, "learning_rate": 7.32659823728928e-06, "epoch": 3.8445945945945947, "percentage": 96.11, "elapsed_time": "2:31:15", "remaining_time": "0:06:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1139, "total_steps": 1184, "loss": 0.1031, "learning_rate": 7.027393147871994e-06, "epoch": 3.847972972972973, "percentage": 96.2, "elapsed_time": "2:31:20", "remaining_time": "0:05:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1140, "total_steps": 1184, "loss": 0.1105, "learning_rate": 6.733427982957593e-06, "epoch": 3.8513513513513513, "percentage": 96.28, "elapsed_time": "2:31:25", "remaining_time": "0:05:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1141, "total_steps": 1184, "loss": 0.1155, "learning_rate": 6.444788436349374e-06, "epoch": 3.85472972972973, "percentage": 96.37, "elapsed_time": "2:31:31", "remaining_time": "0:05:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1142, "total_steps": 1184, "loss": 0.1113, "learning_rate": 6.16155864937929e-06, "epoch": 3.858108108108108, "percentage": 96.45, "elapsed_time": "2:31:36", "remaining_time": "0:05:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1143, "total_steps": 1184, "loss": 0.1113, "learning_rate": 5.883821186379955e-06, "epoch": 3.8614864864864864, "percentage": 96.54, "elapsed_time": "2:31:41", "remaining_time": "0:05:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1144, "total_steps": 1184, "loss": 0.1173, "learning_rate": 5.6116570106162695e-06, "epoch": 3.864864864864865, "percentage": 96.62, "elapsed_time": "2:31:46", "remaining_time": "0:05:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1145, "total_steps": 1184, "loss": 0.1076, "learning_rate": 5.345145460683825e-06, "epoch": 3.868243243243243, "percentage": 96.71, "elapsed_time": "2:31:51", "remaining_time": "0:05:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1146, "total_steps": 1184, "loss": 0.1073, "learning_rate": 5.0843642273809276e-06, "epoch": 3.8716216216216215, "percentage": 96.79, "elapsed_time": "2:31:56", "remaining_time": "0:05:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1147, "total_steps": 1184, "loss": 0.1016, "learning_rate": 4.82938933106091e-06, "epoch": 3.875, "percentage": 96.88, "elapsed_time": "2:32:01", "remaining_time": "0:04:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1148, "total_steps": 1184, "loss": 0.1038, "learning_rate": 4.5802950994714764e-06, "epoch": 3.8783783783783785, "percentage": 96.96, "elapsed_time": "2:32:06", "remaining_time": "0:04:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1149, "total_steps": 1184, "loss": 0.1083, "learning_rate": 4.337154146087377e-06, "epoch": 3.881756756756757, "percentage": 97.04, "elapsed_time": "2:32:12", "remaining_time": "0:04:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1150, "total_steps": 1184, "loss": 0.099, "learning_rate": 4.100037348942866e-06, "epoch": 3.885135135135135, "percentage": 97.13, "elapsed_time": "2:32:17", "remaining_time": "0:04:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1151, "total_steps": 1184, "loss": 0.1017, "learning_rate": 3.869013829970057e-06, "epoch": 3.8885135135135136, "percentage": 97.21, "elapsed_time": "2:32:22", "remaining_time": "0:04:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1152, "total_steps": 1184, "loss": 0.1, "learning_rate": 3.644150934849158e-06, "epoch": 3.891891891891892, "percentage": 97.3, "elapsed_time": "2:32:27", "remaining_time": "0:04:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1153, "total_steps": 1184, "loss": 0.1023, "learning_rate": 3.425514213376533e-06, "epoch": 3.89527027027027, "percentage": 97.38, "elapsed_time": "2:32:32", "remaining_time": "0:04:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1154, "total_steps": 1184, "loss": 0.0937, "learning_rate": 3.213167400356303e-06, "epoch": 3.8986486486486487, "percentage": 97.47, "elapsed_time": "2:32:37", "remaining_time": "0:03:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1155, "total_steps": 1184, "loss": 0.1108, "learning_rate": 3.007172397020972e-06, "epoch": 3.902027027027027, "percentage": 97.55, "elapsed_time": "2:32:42", "remaining_time": "0:03:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1156, "total_steps": 1184, "loss": 0.1025, "learning_rate": 2.8075892529866257e-06, "epoch": 3.9054054054054053, "percentage": 97.64, "elapsed_time": "2:32:48", "remaining_time": "0:03:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1157, "total_steps": 1184, "loss": 0.107, "learning_rate": 2.6144761487478416e-06, "epoch": 3.9087837837837838, "percentage": 97.72, "elapsed_time": "2:32:53", "remaining_time": "0:03:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1158, "total_steps": 1184, "loss": 0.1216, "learning_rate": 2.4278893787174935e-06, "epoch": 3.9121621621621623, "percentage": 97.8, "elapsed_time": "2:32:58", "remaining_time": "0:03:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1159, "total_steps": 1184, "loss": 0.3528, "learning_rate": 2.2478833348163886e-06, "epoch": 3.9155405405405403, "percentage": 97.89, "elapsed_time": "2:33:03", "remaining_time": "0:03:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1160, "total_steps": 1184, "loss": 0.0981, "learning_rate": 2.074510490617438e-06, "epoch": 3.918918918918919, "percentage": 97.97, "elapsed_time": "2:33:08", "remaining_time": "0:03:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1161, "total_steps": 1184, "loss": 0.1003, "learning_rate": 1.9078213860491097e-06, "epoch": 3.9222972972972974, "percentage": 98.06, "elapsed_time": "2:33:13", "remaining_time": "0:03:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1162, "total_steps": 1184, "loss": 0.096, "learning_rate": 1.7478646126625187e-06, "epoch": 3.9256756756756754, "percentage": 98.14, "elapsed_time": "2:33:18", "remaining_time": "0:02:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1163, "total_steps": 1184, "loss": 0.1062, "learning_rate": 1.5946867994665007e-06, "epoch": 3.929054054054054, "percentage": 98.23, "elapsed_time": "2:33:23", "remaining_time": "0:02:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1164, "total_steps": 1184, "loss": 0.102, "learning_rate": 1.4483325993347872e-06, "epoch": 3.9324324324324325, "percentage": 98.31, "elapsed_time": "2:33:29", "remaining_time": "0:02:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1165, "total_steps": 1184, "loss": 0.1049, "learning_rate": 1.308844675989258e-06, "epoch": 3.935810810810811, "percentage": 98.4, "elapsed_time": "2:33:35", "remaining_time": "0:02:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1166, "total_steps": 1184, "loss": 0.1019, "learning_rate": 1.1762636915630122e-06, "epoch": 3.939189189189189, "percentage": 98.48, "elapsed_time": "2:33:40", "remaining_time": "0:02:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1167, "total_steps": 1184, "loss": 0.0962, "learning_rate": 1.0506282947469768e-06, "epoch": 3.9425675675675675, "percentage": 98.56, "elapsed_time": "2:33:45", "remaining_time": "0:02:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1168, "total_steps": 1184, "loss": 0.3502, "learning_rate": 9.319751095233885e-07, "epoch": 3.945945945945946, "percentage": 98.65, "elapsed_time": "2:33:50", "remaining_time": "0:02:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1169, "total_steps": 1184, "loss": 0.0968, "learning_rate": 8.203387244895631e-07, "epoch": 3.9493243243243246, "percentage": 98.73, "elapsed_time": "2:33:55", "remaining_time": "0:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1170, "total_steps": 1184, "loss": 0.1097, "learning_rate": 7.157516827749585e-07, "epoch": 3.9527027027027026, "percentage": 98.82, "elapsed_time": "2:34:00", "remaining_time": "0:01:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1171, "total_steps": 1184, "loss": 0.1067, "learning_rate": 6.182444725545342e-07, "epoch": 3.956081081081081, "percentage": 98.9, "elapsed_time": "2:34:06", "remaining_time": "0:01:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1172, "total_steps": 1184, "loss": 0.1061, "learning_rate": 5.278455181611357e-07, "epoch": 3.9594594594594597, "percentage": 98.99, "elapsed_time": "2:34:11", "remaining_time": "0:01:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1173, "total_steps": 1184, "loss": 0.1081, "learning_rate": 4.445811717995063e-07, "epoch": 3.9628378378378377, "percentage": 99.07, "elapsed_time": "2:34:16", "remaining_time": "0:01:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1174, "total_steps": 1184, "loss": 0.097, "learning_rate": 3.684757058643714e-07, "epoch": 3.9662162162162162, "percentage": 99.16, "elapsed_time": "2:34:23", "remaining_time": "0:01:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1175, "total_steps": 1184, "loss": 0.1069, "learning_rate": 2.995513058647855e-07, "epoch": 3.9695945945945947, "percentage": 99.24, "elapsed_time": "2:34:28", "remaining_time": "0:01:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1176, "total_steps": 1184, "loss": 0.1168, "learning_rate": 2.3782806395682474e-07, "epoch": 3.972972972972973, "percentage": 99.32, "elapsed_time": "2:34:33", "remaining_time": "0:01:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1177, "total_steps": 1184, "loss": 0.105, "learning_rate": 1.8332397308652485e-07, "epoch": 3.9763513513513513, "percentage": 99.41, "elapsed_time": "2:34:39", "remaining_time": "0:00:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1178, "total_steps": 1184, "loss": 0.0984, "learning_rate": 1.3605492174477425e-07, "epoch": 3.97972972972973, "percentage": 99.49, "elapsed_time": "2:34:44", "remaining_time": "0:00:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1179, "total_steps": 1184, "loss": 0.1039, "learning_rate": 9.603468933562955e-08, "epoch": 3.983108108108108, "percentage": 99.58, "elapsed_time": "2:34:49", "remaining_time": "0:00:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1180, "total_steps": 1184, "loss": 0.098, "learning_rate": 6.32749421594948e-08, "epoch": 3.9864864864864864, "percentage": 99.66, "elapsed_time": "2:34:54", "remaining_time": "0:00:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1181, "total_steps": 1184, "loss": 0.1196, "learning_rate": 3.778523001229054e-08, "epoch": 3.989864864864865, "percentage": 99.75, "elapsed_time": "2:34:59", "remaining_time": "0:00:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1182, "total_steps": 1184, "loss": 0.1071, "learning_rate": 1.957298340156484e-08, "epoch": 3.993243243243243, "percentage": 99.83, "elapsed_time": "2:35:04", "remaining_time": "0:00:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1183, "total_steps": 1184, "loss": 0.1043, "learning_rate": 8.64351138044836e-09, "epoch": 3.9966216216216215, "percentage": 99.92, "elapsed_time": "2:35:09", "remaining_time": "0:00:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1184, "total_steps": 1184, "loss": 0.0813, "learning_rate": 5e-09, "epoch": 4.0, "percentage": 100.0, "elapsed_time": "2:35:15", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1184, "total_steps": 1184, "epoch": 4.0, "percentage": 100.0, "elapsed_time": "2:49:56", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}