{"current_steps": 2, "total_steps": 3080, "loss": 1.1716, "learning_rate": 1.298701298701299e-07, "epoch": 0.0012980691221807562, "percentage": 0.06, "elapsed_time": "0:00:35", "remaining_time": "15:01:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4, "total_steps": 3080, "loss": 1.1279, "learning_rate": 2.597402597402598e-07, "epoch": 0.0025961382443615124, "percentage": 0.13, "elapsed_time": "0:01:16", "remaining_time": "16:18:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6, "total_steps": 3080, "loss": 1.2463, "learning_rate": 3.896103896103896e-07, "epoch": 0.0038942073665422685, "percentage": 0.19, "elapsed_time": "0:01:58", "remaining_time": "16:48:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8, "total_steps": 3080, "loss": 1.1527, "learning_rate": 5.194805194805196e-07, "epoch": 0.005192276488723025, "percentage": 0.26, "elapsed_time": "0:02:38", "remaining_time": "16:51:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10, "total_steps": 3080, "loss": 1.1291, "learning_rate": 6.493506493506493e-07, "epoch": 0.0064903456109037805, "percentage": 0.32, "elapsed_time": "0:03:17", "remaining_time": "16:52:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12, "total_steps": 3080, "loss": 1.1338, "learning_rate": 7.792207792207792e-07, "epoch": 0.007788414733084537, "percentage": 0.39, "elapsed_time": "0:03:59", "remaining_time": "17:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14, "total_steps": 3080, "loss": 1.136, "learning_rate": 9.090909090909091e-07, "epoch": 0.009086483855265294, "percentage": 0.45, "elapsed_time": "0:04:36", "remaining_time": "16:50:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16, "total_steps": 3080, "loss": 1.1277, "learning_rate": 1.0389610389610392e-06, "epoch": 0.01038455297744605, "percentage": 0.52, "elapsed_time": "0:05:15", "remaining_time": "16:45:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18, "total_steps": 3080, "loss": 1.117, "learning_rate": 1.168831168831169e-06, "epoch": 0.011682622099626805, "percentage": 0.58, "elapsed_time": "0:05:55", "remaining_time": "16:47:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20, "total_steps": 3080, "loss": 1.1154, "learning_rate": 1.2987012987012986e-06, "epoch": 0.012980691221807561, "percentage": 0.65, "elapsed_time": "0:06:34", "remaining_time": "16:46:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22, "total_steps": 3080, "loss": 1.0971, "learning_rate": 1.4285714285714286e-06, "epoch": 0.014278760343988317, "percentage": 0.71, "elapsed_time": "0:07:16", "remaining_time": "16:50:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24, "total_steps": 3080, "loss": 1.1125, "learning_rate": 1.5584415584415584e-06, "epoch": 0.015576829466169074, "percentage": 0.78, "elapsed_time": "0:07:52", "remaining_time": "16:43:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26, "total_steps": 3080, "loss": 1.0816, "learning_rate": 1.6883116883116885e-06, "epoch": 0.01687489858834983, "percentage": 0.84, "elapsed_time": "0:08:34", "remaining_time": "16:47:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28, "total_steps": 3080, "loss": 1.024, "learning_rate": 1.8181818181818183e-06, "epoch": 0.018172967710530587, "percentage": 0.91, "elapsed_time": "0:09:20", "remaining_time": "16:58:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30, "total_steps": 3080, "loss": 1.009, "learning_rate": 1.9480519480519483e-06, "epoch": 0.01947103683271134, "percentage": 0.97, "elapsed_time": "0:09:58", "remaining_time": "16:54:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 32, "total_steps": 3080, "loss": 0.9808, "learning_rate": 2.0779220779220784e-06, "epoch": 0.0207691059548921, "percentage": 1.04, "elapsed_time": "0:10:39", "remaining_time": "16:55:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 34, "total_steps": 3080, "loss": 0.9697, "learning_rate": 2.207792207792208e-06, "epoch": 0.022067175077072853, "percentage": 1.1, "elapsed_time": "0:11:18", "remaining_time": "16:53:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 36, "total_steps": 3080, "loss": 0.9016, "learning_rate": 2.337662337662338e-06, "epoch": 0.02336524419925361, "percentage": 1.17, "elapsed_time": "0:11:58", "remaining_time": "16:53:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 38, "total_steps": 3080, "loss": 0.8959, "learning_rate": 2.4675324675324676e-06, "epoch": 0.024663313321434368, "percentage": 1.23, "elapsed_time": "0:12:40", "remaining_time": "16:54:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 40, "total_steps": 3080, "loss": 0.8125, "learning_rate": 2.597402597402597e-06, "epoch": 0.025961382443615122, "percentage": 1.3, "elapsed_time": "0:13:19", "remaining_time": "16:52:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 42, "total_steps": 3080, "loss": 0.8685, "learning_rate": 2.7272727272727272e-06, "epoch": 0.02725945156579588, "percentage": 1.36, "elapsed_time": "0:13:59", "remaining_time": "16:52:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 44, "total_steps": 3080, "loss": 0.7961, "learning_rate": 2.8571428571428573e-06, "epoch": 0.028557520687976633, "percentage": 1.43, "elapsed_time": "0:14:41", "remaining_time": "16:53:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 46, "total_steps": 3080, "loss": 0.7846, "learning_rate": 2.9870129870129873e-06, "epoch": 0.02985558981015739, "percentage": 1.49, "elapsed_time": "0:15:21", "remaining_time": "16:53:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 48, "total_steps": 3080, "loss": 0.7042, "learning_rate": 3.116883116883117e-06, "epoch": 0.03115365893233815, "percentage": 1.56, "elapsed_time": "0:16:02", "remaining_time": "16:52:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 3080, "loss": 0.7043, "learning_rate": 3.246753246753247e-06, "epoch": 0.0324517280545189, "percentage": 1.62, "elapsed_time": "0:16:43", "remaining_time": "16:53:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 52, "total_steps": 3080, "loss": 0.6678, "learning_rate": 3.376623376623377e-06, "epoch": 0.03374979717669966, "percentage": 1.69, "elapsed_time": "0:17:22", "remaining_time": "16:51:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 54, "total_steps": 3080, "loss": 0.7099, "learning_rate": 3.506493506493507e-06, "epoch": 0.03504786629888042, "percentage": 1.75, "elapsed_time": "0:17:57", "remaining_time": "16:46:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 56, "total_steps": 3080, "loss": 0.6423, "learning_rate": 3.6363636363636366e-06, "epoch": 0.036345935421061175, "percentage": 1.82, "elapsed_time": "0:18:44", "remaining_time": "16:51:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 58, "total_steps": 3080, "loss": 0.5418, "learning_rate": 3.7662337662337666e-06, "epoch": 0.037644004543241925, "percentage": 1.88, "elapsed_time": "0:19:24", "remaining_time": "16:51:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 60, "total_steps": 3080, "loss": 0.5407, "learning_rate": 3.896103896103897e-06, "epoch": 0.03894207366542268, "percentage": 1.95, "elapsed_time": "0:20:03", "remaining_time": "16:49:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 62, "total_steps": 3080, "loss": 0.5437, "learning_rate": 4.025974025974026e-06, "epoch": 0.04024014278760344, "percentage": 2.01, "elapsed_time": "0:20:46", "remaining_time": "16:51:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 64, "total_steps": 3080, "loss": 0.4655, "learning_rate": 4.155844155844157e-06, "epoch": 0.0415382119097842, "percentage": 2.08, "elapsed_time": "0:21:30", "remaining_time": "16:53:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 66, "total_steps": 3080, "loss": 0.4997, "learning_rate": 4.2857142857142855e-06, "epoch": 0.042836281031964955, "percentage": 2.14, "elapsed_time": "0:22:09", "remaining_time": "16:51:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 68, "total_steps": 3080, "loss": 0.4846, "learning_rate": 4.415584415584416e-06, "epoch": 0.044134350154145706, "percentage": 2.21, "elapsed_time": "0:22:46", "remaining_time": "16:48:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 3080, "loss": 0.4522, "learning_rate": 4.5454545454545455e-06, "epoch": 0.04543241927632646, "percentage": 2.27, "elapsed_time": "0:23:28", "remaining_time": "16:49:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 72, "total_steps": 3080, "loss": 0.3711, "learning_rate": 4.675324675324676e-06, "epoch": 0.04673048839850722, "percentage": 2.34, "elapsed_time": "0:24:10", "remaining_time": "16:49:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 74, "total_steps": 3080, "loss": 0.3815, "learning_rate": 4.805194805194806e-06, "epoch": 0.04802855752068798, "percentage": 2.4, "elapsed_time": "0:24:50", "remaining_time": "16:48:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 76, "total_steps": 3080, "loss": 0.4273, "learning_rate": 4.935064935064935e-06, "epoch": 0.049326626642868736, "percentage": 2.47, "elapsed_time": "0:25:29", "remaining_time": "16:47:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 78, "total_steps": 3080, "loss": 0.408, "learning_rate": 5.064935064935065e-06, "epoch": 0.050624695765049486, "percentage": 2.53, "elapsed_time": "0:26:09", "remaining_time": "16:46:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 80, "total_steps": 3080, "loss": 0.388, "learning_rate": 5.194805194805194e-06, "epoch": 0.051922764887230244, "percentage": 2.6, "elapsed_time": "0:26:48", "remaining_time": "16:45:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 82, "total_steps": 3080, "loss": 0.347, "learning_rate": 5.324675324675325e-06, "epoch": 0.053220834009411, "percentage": 2.66, "elapsed_time": "0:27:27", "remaining_time": "16:43:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 84, "total_steps": 3080, "loss": 0.3856, "learning_rate": 5.4545454545454545e-06, "epoch": 0.05451890313159176, "percentage": 2.73, "elapsed_time": "0:28:01", "remaining_time": "16:39:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 86, "total_steps": 3080, "loss": 0.372, "learning_rate": 5.584415584415585e-06, "epoch": 0.055816972253772516, "percentage": 2.79, "elapsed_time": "0:28:39", "remaining_time": "16:37:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 88, "total_steps": 3080, "loss": 0.3667, "learning_rate": 5.7142857142857145e-06, "epoch": 0.05711504137595327, "percentage": 2.86, "elapsed_time": "0:29:19", "remaining_time": "16:36:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 90, "total_steps": 3080, "loss": 0.3881, "learning_rate": 5.844155844155844e-06, "epoch": 0.058413110498134024, "percentage": 2.92, "elapsed_time": "0:29:57", "remaining_time": "16:35:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 92, "total_steps": 3080, "loss": 0.366, "learning_rate": 5.9740259740259746e-06, "epoch": 0.05971117962031478, "percentage": 2.99, "elapsed_time": "0:30:37", "remaining_time": "16:34:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 94, "total_steps": 3080, "loss": 0.3555, "learning_rate": 6.103896103896104e-06, "epoch": 0.06100924874249554, "percentage": 3.05, "elapsed_time": "0:31:16", "remaining_time": "16:33:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 96, "total_steps": 3080, "loss": 0.3948, "learning_rate": 6.233766233766234e-06, "epoch": 0.0623073178646763, "percentage": 3.12, "elapsed_time": "0:31:56", "remaining_time": "16:33:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 98, "total_steps": 3080, "loss": 0.3536, "learning_rate": 6.363636363636364e-06, "epoch": 0.06360538698685705, "percentage": 3.18, "elapsed_time": "0:32:34", "remaining_time": "16:31:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 3080, "loss": 0.3367, "learning_rate": 6.493506493506494e-06, "epoch": 0.0649034561090378, "percentage": 3.25, "elapsed_time": "0:33:14", "remaining_time": "16:30:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 102, "total_steps": 3080, "loss": 0.3424, "learning_rate": 6.623376623376624e-06, "epoch": 0.06620152523121857, "percentage": 3.31, "elapsed_time": "0:33:58", "remaining_time": "16:31:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 104, "total_steps": 3080, "loss": 0.3337, "learning_rate": 6.753246753246754e-06, "epoch": 0.06749959435339932, "percentage": 3.38, "elapsed_time": "0:34:42", "remaining_time": "16:33:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 106, "total_steps": 3080, "loss": 0.3646, "learning_rate": 6.8831168831168835e-06, "epoch": 0.06879766347558007, "percentage": 3.44, "elapsed_time": "0:35:21", "remaining_time": "16:31:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 108, "total_steps": 3080, "loss": 0.3351, "learning_rate": 7.012987012987014e-06, "epoch": 0.07009573259776083, "percentage": 3.51, "elapsed_time": "0:36:01", "remaining_time": "16:31:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 110, "total_steps": 3080, "loss": 0.3414, "learning_rate": 7.1428571428571436e-06, "epoch": 0.07139380171994159, "percentage": 3.57, "elapsed_time": "0:36:39", "remaining_time": "16:29:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 112, "total_steps": 3080, "loss": 0.3445, "learning_rate": 7.272727272727273e-06, "epoch": 0.07269187084212235, "percentage": 3.64, "elapsed_time": "0:37:18", "remaining_time": "16:28:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 114, "total_steps": 3080, "loss": 0.3645, "learning_rate": 7.402597402597404e-06, "epoch": 0.0739899399643031, "percentage": 3.7, "elapsed_time": "0:38:01", "remaining_time": "16:29:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 116, "total_steps": 3080, "loss": 0.3386, "learning_rate": 7.532467532467533e-06, "epoch": 0.07528800908648385, "percentage": 3.77, "elapsed_time": "0:38:37", "remaining_time": "16:27:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 118, "total_steps": 3080, "loss": 0.3298, "learning_rate": 7.662337662337663e-06, "epoch": 0.07658607820866462, "percentage": 3.83, "elapsed_time": "0:39:17", "remaining_time": "16:26:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 120, "total_steps": 3080, "loss": 0.3667, "learning_rate": 7.792207792207793e-06, "epoch": 0.07788414733084537, "percentage": 3.9, "elapsed_time": "0:39:56", "remaining_time": "16:25:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 122, "total_steps": 3080, "loss": 0.3581, "learning_rate": 7.922077922077924e-06, "epoch": 0.07918221645302613, "percentage": 3.96, "elapsed_time": "0:40:33", "remaining_time": "16:23:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 124, "total_steps": 3080, "loss": 0.3472, "learning_rate": 8.051948051948052e-06, "epoch": 0.08048028557520688, "percentage": 4.03, "elapsed_time": "0:41:19", "remaining_time": "16:24:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 126, "total_steps": 3080, "loss": 0.3731, "learning_rate": 8.181818181818183e-06, "epoch": 0.08177835469738763, "percentage": 4.09, "elapsed_time": "0:42:03", "remaining_time": "16:25:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 128, "total_steps": 3080, "loss": 0.3662, "learning_rate": 8.311688311688313e-06, "epoch": 0.0830764238195684, "percentage": 4.16, "elapsed_time": "0:42:46", "remaining_time": "16:26:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 130, "total_steps": 3080, "loss": 0.4006, "learning_rate": 8.441558441558442e-06, "epoch": 0.08437449294174915, "percentage": 4.22, "elapsed_time": "0:43:29", "remaining_time": "16:26:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 132, "total_steps": 3080, "loss": 0.3308, "learning_rate": 8.571428571428571e-06, "epoch": 0.08567256206392991, "percentage": 4.29, "elapsed_time": "0:44:06", "remaining_time": "16:25:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 134, "total_steps": 3080, "loss": 0.3306, "learning_rate": 8.701298701298701e-06, "epoch": 0.08697063118611066, "percentage": 4.35, "elapsed_time": "0:44:45", "remaining_time": "16:23:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 136, "total_steps": 3080, "loss": 0.3972, "learning_rate": 8.831168831168832e-06, "epoch": 0.08826870030829141, "percentage": 4.42, "elapsed_time": "0:45:30", "remaining_time": "16:24:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 138, "total_steps": 3080, "loss": 0.3602, "learning_rate": 8.96103896103896e-06, "epoch": 0.08956676943047218, "percentage": 4.48, "elapsed_time": "0:46:08", "remaining_time": "16:23:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 3080, "loss": 0.3551, "learning_rate": 9.090909090909091e-06, "epoch": 0.09086483855265293, "percentage": 4.55, "elapsed_time": "0:46:46", "remaining_time": "16:22:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 142, "total_steps": 3080, "loss": 0.3412, "learning_rate": 9.220779220779221e-06, "epoch": 0.09216290767483369, "percentage": 4.61, "elapsed_time": "0:47:27", "remaining_time": "16:21:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 144, "total_steps": 3080, "loss": 0.3265, "learning_rate": 9.350649350649352e-06, "epoch": 0.09346097679701444, "percentage": 4.68, "elapsed_time": "0:48:03", "remaining_time": "16:19:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 146, "total_steps": 3080, "loss": 0.3353, "learning_rate": 9.48051948051948e-06, "epoch": 0.09475904591919519, "percentage": 4.74, "elapsed_time": "0:48:44", "remaining_time": "16:19:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 148, "total_steps": 3080, "loss": 0.3603, "learning_rate": 9.610389610389611e-06, "epoch": 0.09605711504137596, "percentage": 4.81, "elapsed_time": "0:49:23", "remaining_time": "16:18:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 3080, "loss": 0.3707, "learning_rate": 9.740259740259742e-06, "epoch": 0.09735518416355671, "percentage": 4.87, "elapsed_time": "0:50:07", "remaining_time": "16:19:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 152, "total_steps": 3080, "loss": 0.3549, "learning_rate": 9.87012987012987e-06, "epoch": 0.09865325328573747, "percentage": 4.94, "elapsed_time": "0:50:51", "remaining_time": "16:19:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 154, "total_steps": 3080, "loss": 0.32, "learning_rate": 1e-05, "epoch": 0.09995132240791822, "percentage": 5.0, "elapsed_time": "0:51:30", "remaining_time": "16:18:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 156, "total_steps": 3080, "loss": 0.3527, "learning_rate": 9.999988472080506e-06, "epoch": 0.10124939153009897, "percentage": 5.06, "elapsed_time": "0:52:08", "remaining_time": "16:17:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 158, "total_steps": 3080, "loss": 0.3368, "learning_rate": 9.999953888375178e-06, "epoch": 0.10254746065227974, "percentage": 5.13, "elapsed_time": "0:52:49", "remaining_time": "16:16:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 160, "total_steps": 3080, "loss": 0.345, "learning_rate": 9.999896249043488e-06, "epoch": 0.10384552977446049, "percentage": 5.19, "elapsed_time": "0:53:31", "remaining_time": "16:16:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 162, "total_steps": 3080, "loss": 0.3544, "learning_rate": 9.999815554351224e-06, "epoch": 0.10514359889664125, "percentage": 5.26, "elapsed_time": "0:54:10", "remaining_time": "16:15:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 164, "total_steps": 3080, "loss": 0.3177, "learning_rate": 9.999711804670478e-06, "epoch": 0.106441668018822, "percentage": 5.32, "elapsed_time": "0:54:53", "remaining_time": "16:15:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 166, "total_steps": 3080, "loss": 0.3642, "learning_rate": 9.999585000479658e-06, "epoch": 0.10773973714100275, "percentage": 5.39, "elapsed_time": "0:55:33", "remaining_time": "16:15:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 168, "total_steps": 3080, "loss": 0.3599, "learning_rate": 9.999435142363484e-06, "epoch": 0.10903780626318352, "percentage": 5.45, "elapsed_time": "0:56:14", "remaining_time": "16:14:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 170, "total_steps": 3080, "loss": 0.3509, "learning_rate": 9.999262231012971e-06, "epoch": 0.11033587538536427, "percentage": 5.52, "elapsed_time": "0:56:55", "remaining_time": "16:14:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 172, "total_steps": 3080, "loss": 0.339, "learning_rate": 9.999066267225447e-06, "epoch": 0.11163394450754503, "percentage": 5.58, "elapsed_time": "0:57:34", "remaining_time": "16:13:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 174, "total_steps": 3080, "loss": 0.3526, "learning_rate": 9.998847251904529e-06, "epoch": 0.11293201362972578, "percentage": 5.65, "elapsed_time": "0:58:11", "remaining_time": "16:11:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 176, "total_steps": 3080, "loss": 0.3286, "learning_rate": 9.998605186060138e-06, "epoch": 0.11423008275190653, "percentage": 5.71, "elapsed_time": "0:58:47", "remaining_time": "16:10:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 178, "total_steps": 3080, "loss": 0.3522, "learning_rate": 9.998340070808478e-06, "epoch": 0.1155281518740873, "percentage": 5.78, "elapsed_time": "0:59:29", "remaining_time": "16:09:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 180, "total_steps": 3080, "loss": 0.3546, "learning_rate": 9.99805190737204e-06, "epoch": 0.11682622099626805, "percentage": 5.84, "elapsed_time": "1:00:08", "remaining_time": "16:08:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 182, "total_steps": 3080, "loss": 0.3295, "learning_rate": 9.997740697079595e-06, "epoch": 0.11812429011844881, "percentage": 5.91, "elapsed_time": "1:00:43", "remaining_time": "16:07:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 184, "total_steps": 3080, "loss": 0.3439, "learning_rate": 9.997406441366182e-06, "epoch": 0.11942235924062956, "percentage": 5.97, "elapsed_time": "1:01:25", "remaining_time": "16:06:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 186, "total_steps": 3080, "loss": 0.3635, "learning_rate": 9.997049141773117e-06, "epoch": 0.12072042836281031, "percentage": 6.04, "elapsed_time": "1:02:07", "remaining_time": "16:06:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 188, "total_steps": 3080, "loss": 0.342, "learning_rate": 9.996668799947962e-06, "epoch": 0.12201849748499108, "percentage": 6.1, "elapsed_time": "1:02:45", "remaining_time": "16:05:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 190, "total_steps": 3080, "loss": 0.322, "learning_rate": 9.99626541764454e-06, "epoch": 0.12331656660717183, "percentage": 6.17, "elapsed_time": "1:03:26", "remaining_time": "16:04:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 192, "total_steps": 3080, "loss": 0.3706, "learning_rate": 9.995838996722916e-06, "epoch": 0.1246146357293526, "percentage": 6.23, "elapsed_time": "1:04:03", "remaining_time": "16:03:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 194, "total_steps": 3080, "loss": 0.3224, "learning_rate": 9.995389539149386e-06, "epoch": 0.12591270485153336, "percentage": 6.3, "elapsed_time": "1:04:47", "remaining_time": "16:03:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 196, "total_steps": 3080, "loss": 0.3507, "learning_rate": 9.994917046996472e-06, "epoch": 0.1272107739737141, "percentage": 6.36, "elapsed_time": "1:05:27", "remaining_time": "16:03:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 198, "total_steps": 3080, "loss": 0.3375, "learning_rate": 9.99442152244292e-06, "epoch": 0.12850884309589486, "percentage": 6.43, "elapsed_time": "1:06:09", "remaining_time": "16:02:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 3080, "loss": 0.3355, "learning_rate": 9.993902967773674e-06, "epoch": 0.1298069122180756, "percentage": 6.49, "elapsed_time": "1:06:50", "remaining_time": "16:02:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 202, "total_steps": 3080, "loss": 0.3303, "learning_rate": 9.993361385379876e-06, "epoch": 0.13110498134025636, "percentage": 6.56, "elapsed_time": "1:07:28", "remaining_time": "16:01:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 204, "total_steps": 3080, "loss": 0.3539, "learning_rate": 9.992796777758855e-06, "epoch": 0.13240305046243714, "percentage": 6.62, "elapsed_time": "1:08:07", "remaining_time": "16:00:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 206, "total_steps": 3080, "loss": 0.3123, "learning_rate": 9.992209147514108e-06, "epoch": 0.1337011195846179, "percentage": 6.69, "elapsed_time": "1:08:47", "remaining_time": "15:59:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 208, "total_steps": 3080, "loss": 0.3491, "learning_rate": 9.991598497355304e-06, "epoch": 0.13499918870679864, "percentage": 6.75, "elapsed_time": "1:09:26", "remaining_time": "15:58:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 3080, "loss": 0.358, "learning_rate": 9.990964830098246e-06, "epoch": 0.1362972578289794, "percentage": 6.82, "elapsed_time": "1:10:11", "remaining_time": "15:59:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 212, "total_steps": 3080, "loss": 0.321, "learning_rate": 9.990308148664882e-06, "epoch": 0.13759532695116014, "percentage": 6.88, "elapsed_time": "1:10:54", "remaining_time": "15:59:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 214, "total_steps": 3080, "loss": 0.3341, "learning_rate": 9.989628456083283e-06, "epoch": 0.13889339607334092, "percentage": 6.95, "elapsed_time": "1:11:31", "remaining_time": "15:57:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 216, "total_steps": 3080, "loss": 0.3606, "learning_rate": 9.988925755487622e-06, "epoch": 0.14019146519552167, "percentage": 7.01, "elapsed_time": "1:12:10", "remaining_time": "15:56:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 218, "total_steps": 3080, "loss": 0.3554, "learning_rate": 9.98820005011817e-06, "epoch": 0.14148953431770242, "percentage": 7.08, "elapsed_time": "1:12:52", "remaining_time": "15:56:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 220, "total_steps": 3080, "loss": 0.337, "learning_rate": 9.98745134332128e-06, "epoch": 0.14278760343988317, "percentage": 7.14, "elapsed_time": "1:13:32", "remaining_time": "15:56:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 222, "total_steps": 3080, "loss": 0.3436, "learning_rate": 9.98667963854936e-06, "epoch": 0.14408567256206392, "percentage": 7.21, "elapsed_time": "1:14:11", "remaining_time": "15:55:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 224, "total_steps": 3080, "loss": 0.356, "learning_rate": 9.985884939360873e-06, "epoch": 0.1453837416842447, "percentage": 7.27, "elapsed_time": "1:14:53", "remaining_time": "15:54:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 226, "total_steps": 3080, "loss": 0.3241, "learning_rate": 9.985067249420308e-06, "epoch": 0.14668181080642545, "percentage": 7.34, "elapsed_time": "1:15:31", "remaining_time": "15:53:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 228, "total_steps": 3080, "loss": 0.3095, "learning_rate": 9.984226572498173e-06, "epoch": 0.1479798799286062, "percentage": 7.4, "elapsed_time": "1:16:13", "remaining_time": "15:53:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 230, "total_steps": 3080, "loss": 0.3292, "learning_rate": 9.983362912470967e-06, "epoch": 0.14927794905078695, "percentage": 7.47, "elapsed_time": "1:16:54", "remaining_time": "15:52:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 232, "total_steps": 3080, "loss": 0.3428, "learning_rate": 9.982476273321175e-06, "epoch": 0.1505760181729677, "percentage": 7.53, "elapsed_time": "1:17:32", "remaining_time": "15:51:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 234, "total_steps": 3080, "loss": 0.3245, "learning_rate": 9.981566659137238e-06, "epoch": 0.15187408729514848, "percentage": 7.6, "elapsed_time": "1:18:14", "remaining_time": "15:51:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 236, "total_steps": 3080, "loss": 0.3447, "learning_rate": 9.980634074113538e-06, "epoch": 0.15317215641732923, "percentage": 7.66, "elapsed_time": "1:18:51", "remaining_time": "15:50:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 238, "total_steps": 3080, "loss": 0.3328, "learning_rate": 9.979678522550382e-06, "epoch": 0.15447022553950998, "percentage": 7.73, "elapsed_time": "1:19:32", "remaining_time": "15:49:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 240, "total_steps": 3080, "loss": 0.3513, "learning_rate": 9.97870000885398e-06, "epoch": 0.15576829466169073, "percentage": 7.79, "elapsed_time": "1:20:14", "remaining_time": "15:49:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 242, "total_steps": 3080, "loss": 0.3047, "learning_rate": 9.97769853753642e-06, "epoch": 0.15706636378387148, "percentage": 7.86, "elapsed_time": "1:20:57", "remaining_time": "15:49:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 244, "total_steps": 3080, "loss": 0.3237, "learning_rate": 9.976674113215655e-06, "epoch": 0.15836443290605226, "percentage": 7.92, "elapsed_time": "1:21:36", "remaining_time": "15:48:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 246, "total_steps": 3080, "loss": 0.3276, "learning_rate": 9.975626740615478e-06, "epoch": 0.159662502028233, "percentage": 7.99, "elapsed_time": "1:22:15", "remaining_time": "15:47:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 248, "total_steps": 3080, "loss": 0.319, "learning_rate": 9.974556424565503e-06, "epoch": 0.16096057115041376, "percentage": 8.05, "elapsed_time": "1:22:59", "remaining_time": "15:47:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 3080, "loss": 0.3259, "learning_rate": 9.973463170001131e-06, "epoch": 0.1622586402725945, "percentage": 8.12, "elapsed_time": "1:23:41", "remaining_time": "15:47:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 252, "total_steps": 3080, "loss": 0.3016, "learning_rate": 9.972346981963546e-06, "epoch": 0.16355670939477526, "percentage": 8.18, "elapsed_time": "1:24:21", "remaining_time": "15:46:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 254, "total_steps": 3080, "loss": 0.3151, "learning_rate": 9.971207865599679e-06, "epoch": 0.16485477851695604, "percentage": 8.25, "elapsed_time": "1:25:02", "remaining_time": "15:46:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 256, "total_steps": 3080, "loss": 0.3193, "learning_rate": 9.970045826162182e-06, "epoch": 0.1661528476391368, "percentage": 8.31, "elapsed_time": "1:25:43", "remaining_time": "15:45:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 258, "total_steps": 3080, "loss": 0.3412, "learning_rate": 9.96886086900942e-06, "epoch": 0.16745091676131754, "percentage": 8.38, "elapsed_time": "1:26:20", "remaining_time": "15:44:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 260, "total_steps": 3080, "loss": 0.324, "learning_rate": 9.967652999605424e-06, "epoch": 0.1687489858834983, "percentage": 8.44, "elapsed_time": "1:27:00", "remaining_time": "15:43:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 262, "total_steps": 3080, "loss": 0.3476, "learning_rate": 9.966422223519887e-06, "epoch": 0.17004705500567904, "percentage": 8.51, "elapsed_time": "1:27:39", "remaining_time": "15:42:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 264, "total_steps": 3080, "loss": 0.3333, "learning_rate": 9.965168546428122e-06, "epoch": 0.17134512412785982, "percentage": 8.57, "elapsed_time": "1:28:17", "remaining_time": "15:41:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 266, "total_steps": 3080, "loss": 0.3283, "learning_rate": 9.963891974111042e-06, "epoch": 0.17264319325004057, "percentage": 8.64, "elapsed_time": "1:28:57", "remaining_time": "15:41:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 268, "total_steps": 3080, "loss": 0.3187, "learning_rate": 9.96259251245514e-06, "epoch": 0.17394126237222132, "percentage": 8.7, "elapsed_time": "1:29:39", "remaining_time": "15:40:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 270, "total_steps": 3080, "loss": 0.3162, "learning_rate": 9.961270167452449e-06, "epoch": 0.17523933149440207, "percentage": 8.77, "elapsed_time": "1:30:21", "remaining_time": "15:40:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 272, "total_steps": 3080, "loss": 0.3442, "learning_rate": 9.959924945200525e-06, "epoch": 0.17653740061658282, "percentage": 8.83, "elapsed_time": "1:31:02", "remaining_time": "15:39:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 274, "total_steps": 3080, "loss": 0.3248, "learning_rate": 9.958556851902414e-06, "epoch": 0.1778354697387636, "percentage": 8.9, "elapsed_time": "1:31:46", "remaining_time": "15:39:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 276, "total_steps": 3080, "loss": 0.314, "learning_rate": 9.957165893866623e-06, "epoch": 0.17913353886094435, "percentage": 8.96, "elapsed_time": "1:32:24", "remaining_time": "15:38:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 278, "total_steps": 3080, "loss": 0.3207, "learning_rate": 9.955752077507093e-06, "epoch": 0.1804316079831251, "percentage": 9.03, "elapsed_time": "1:33:05", "remaining_time": "15:38:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 3080, "loss": 0.3166, "learning_rate": 9.95431540934317e-06, "epoch": 0.18172967710530585, "percentage": 9.09, "elapsed_time": "1:33:42", "remaining_time": "15:37:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 282, "total_steps": 3080, "loss": 0.3198, "learning_rate": 9.952855895999567e-06, "epoch": 0.1830277462274866, "percentage": 9.16, "elapsed_time": "1:34:19", "remaining_time": "15:35:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 284, "total_steps": 3080, "loss": 0.3227, "learning_rate": 9.951373544206352e-06, "epoch": 0.18432581534966738, "percentage": 9.22, "elapsed_time": "1:35:01", "remaining_time": "15:35:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 286, "total_steps": 3080, "loss": 0.3325, "learning_rate": 9.949868360798893e-06, "epoch": 0.18562388447184813, "percentage": 9.29, "elapsed_time": "1:35:42", "remaining_time": "15:34:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 288, "total_steps": 3080, "loss": 0.3007, "learning_rate": 9.948340352717845e-06, "epoch": 0.18692195359402888, "percentage": 9.35, "elapsed_time": "1:36:21", "remaining_time": "15:34:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 290, "total_steps": 3080, "loss": 0.3168, "learning_rate": 9.946789527009108e-06, "epoch": 0.18822002271620963, "percentage": 9.42, "elapsed_time": "1:37:02", "remaining_time": "15:33:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 292, "total_steps": 3080, "loss": 0.3234, "learning_rate": 9.9452158908238e-06, "epoch": 0.18951809183839038, "percentage": 9.48, "elapsed_time": "1:37:43", "remaining_time": "15:32:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 294, "total_steps": 3080, "loss": 0.3549, "learning_rate": 9.943619451418225e-06, "epoch": 0.19081616096057116, "percentage": 9.55, "elapsed_time": "1:38:20", "remaining_time": "15:31:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 296, "total_steps": 3080, "loss": 0.3219, "learning_rate": 9.942000216153829e-06, "epoch": 0.1921142300827519, "percentage": 9.61, "elapsed_time": "1:39:01", "remaining_time": "15:31:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 298, "total_steps": 3080, "loss": 0.3177, "learning_rate": 9.940358192497178e-06, "epoch": 0.19341229920493266, "percentage": 9.68, "elapsed_time": "1:39:41", "remaining_time": "15:30:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 3080, "loss": 0.3151, "learning_rate": 9.93869338801992e-06, "epoch": 0.19471036832711341, "percentage": 9.74, "elapsed_time": "1:40:24", "remaining_time": "15:30:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 302, "total_steps": 3080, "loss": 0.3183, "learning_rate": 9.937005810398747e-06, "epoch": 0.19600843744929417, "percentage": 9.81, "elapsed_time": "1:41:01", "remaining_time": "15:29:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 304, "total_steps": 3080, "loss": 0.3382, "learning_rate": 9.935295467415363e-06, "epoch": 0.19730650657147494, "percentage": 9.87, "elapsed_time": "1:41:38", "remaining_time": "15:28:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 306, "total_steps": 3080, "loss": 0.327, "learning_rate": 9.933562366956445e-06, "epoch": 0.1986045756936557, "percentage": 9.94, "elapsed_time": "1:42:20", "remaining_time": "15:27:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 308, "total_steps": 3080, "loss": 0.3025, "learning_rate": 9.931806517013612e-06, "epoch": 0.19990264481583644, "percentage": 10.0, "elapsed_time": "1:42:59", "remaining_time": "15:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 310, "total_steps": 3080, "loss": 0.3499, "learning_rate": 9.930027925683384e-06, "epoch": 0.2012007139380172, "percentage": 10.06, "elapsed_time": "1:43:40", "remaining_time": "15:26:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 312, "total_steps": 3080, "loss": 0.3319, "learning_rate": 9.928226601167139e-06, "epoch": 0.20249878306019795, "percentage": 10.13, "elapsed_time": "1:44:19", "remaining_time": "15:25:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 314, "total_steps": 3080, "loss": 0.3031, "learning_rate": 9.92640255177109e-06, "epoch": 0.20379685218237872, "percentage": 10.19, "elapsed_time": "1:44:59", "remaining_time": "15:24:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 316, "total_steps": 3080, "loss": 0.3245, "learning_rate": 9.924555785906235e-06, "epoch": 0.20509492130455947, "percentage": 10.26, "elapsed_time": "1:45:36", "remaining_time": "15:23:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 318, "total_steps": 3080, "loss": 0.3003, "learning_rate": 9.922686312088323e-06, "epoch": 0.20639299042674022, "percentage": 10.32, "elapsed_time": "1:46:16", "remaining_time": "15:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 320, "total_steps": 3080, "loss": 0.3258, "learning_rate": 9.920794138937807e-06, "epoch": 0.20769105954892098, "percentage": 10.39, "elapsed_time": "1:46:52", "remaining_time": "15:21:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 322, "total_steps": 3080, "loss": 0.3447, "learning_rate": 9.918879275179819e-06, "epoch": 0.20898912867110173, "percentage": 10.45, "elapsed_time": "1:47:33", "remaining_time": "15:21:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 324, "total_steps": 3080, "loss": 0.3075, "learning_rate": 9.916941729644112e-06, "epoch": 0.2102871977932825, "percentage": 10.52, "elapsed_time": "1:48:12", "remaining_time": "15:20:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 326, "total_steps": 3080, "loss": 0.3392, "learning_rate": 9.914981511265039e-06, "epoch": 0.21158526691546325, "percentage": 10.58, "elapsed_time": "1:48:50", "remaining_time": "15:19:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 328, "total_steps": 3080, "loss": 0.3018, "learning_rate": 9.912998629081495e-06, "epoch": 0.212883336037644, "percentage": 10.65, "elapsed_time": "1:49:27", "remaining_time": "15:18:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 330, "total_steps": 3080, "loss": 0.3241, "learning_rate": 9.910993092236878e-06, "epoch": 0.21418140515982476, "percentage": 10.71, "elapsed_time": "1:50:05", "remaining_time": "15:17:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 332, "total_steps": 3080, "loss": 0.2979, "learning_rate": 9.90896490997906e-06, "epoch": 0.2154794742820055, "percentage": 10.78, "elapsed_time": "1:50:46", "remaining_time": "15:16:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 334, "total_steps": 3080, "loss": 0.3036, "learning_rate": 9.906914091660327e-06, "epoch": 0.21677754340418628, "percentage": 10.84, "elapsed_time": "1:51:27", "remaining_time": "15:16:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 336, "total_steps": 3080, "loss": 0.3457, "learning_rate": 9.904840646737346e-06, "epoch": 0.21807561252636704, "percentage": 10.91, "elapsed_time": "1:52:09", "remaining_time": "15:16:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 338, "total_steps": 3080, "loss": 0.3235, "learning_rate": 9.902744584771123e-06, "epoch": 0.21937368164854779, "percentage": 10.97, "elapsed_time": "1:52:49", "remaining_time": "15:15:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 340, "total_steps": 3080, "loss": 0.2932, "learning_rate": 9.900625915426948e-06, "epoch": 0.22067175077072854, "percentage": 11.04, "elapsed_time": "1:53:28", "remaining_time": "15:14:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 342, "total_steps": 3080, "loss": 0.3243, "learning_rate": 9.898484648474362e-06, "epoch": 0.2219698198929093, "percentage": 11.1, "elapsed_time": "1:54:10", "remaining_time": "15:14:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 344, "total_steps": 3080, "loss": 0.3184, "learning_rate": 9.896320793787106e-06, "epoch": 0.22326788901509007, "percentage": 11.17, "elapsed_time": "1:54:52", "remaining_time": "15:13:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 346, "total_steps": 3080, "loss": 0.3394, "learning_rate": 9.894134361343077e-06, "epoch": 0.22456595813727082, "percentage": 11.23, "elapsed_time": "1:55:37", "remaining_time": "15:13:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 348, "total_steps": 3080, "loss": 0.327, "learning_rate": 9.891925361224284e-06, "epoch": 0.22586402725945157, "percentage": 11.3, "elapsed_time": "1:56:18", "remaining_time": "15:13:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 3080, "loss": 0.3652, "learning_rate": 9.889693803616793e-06, "epoch": 0.22716209638163232, "percentage": 11.36, "elapsed_time": "1:56:56", "remaining_time": "15:12:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 352, "total_steps": 3080, "loss": 0.314, "learning_rate": 9.887439698810694e-06, "epoch": 0.22846016550381307, "percentage": 11.43, "elapsed_time": "1:57:32", "remaining_time": "15:10:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 354, "total_steps": 3080, "loss": 0.3081, "learning_rate": 9.88516305720004e-06, "epoch": 0.22975823462599385, "percentage": 11.49, "elapsed_time": "1:58:14", "remaining_time": "15:10:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 356, "total_steps": 3080, "loss": 0.3154, "learning_rate": 9.88286388928281e-06, "epoch": 0.2310563037481746, "percentage": 11.56, "elapsed_time": "1:58:51", "remaining_time": "15:09:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 358, "total_steps": 3080, "loss": 0.3115, "learning_rate": 9.880542205660853e-06, "epoch": 0.23235437287035535, "percentage": 11.62, "elapsed_time": "1:59:27", "remaining_time": "15:08:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 360, "total_steps": 3080, "loss": 0.2975, "learning_rate": 9.878198017039839e-06, "epoch": 0.2336524419925361, "percentage": 11.69, "elapsed_time": "2:00:06", "remaining_time": "15:07:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 362, "total_steps": 3080, "loss": 0.2996, "learning_rate": 9.875831334229217e-06, "epoch": 0.23495051111471685, "percentage": 11.75, "elapsed_time": "2:00:45", "remaining_time": "15:06:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 364, "total_steps": 3080, "loss": 0.2892, "learning_rate": 9.873442168142158e-06, "epoch": 0.23624858023689763, "percentage": 11.82, "elapsed_time": "2:01:25", "remaining_time": "15:06:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 366, "total_steps": 3080, "loss": 0.3073, "learning_rate": 9.87103052979551e-06, "epoch": 0.23754664935907838, "percentage": 11.88, "elapsed_time": "2:02:06", "remaining_time": "15:05:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 368, "total_steps": 3080, "loss": 0.3216, "learning_rate": 9.868596430309739e-06, "epoch": 0.23884471848125913, "percentage": 11.95, "elapsed_time": "2:02:45", "remaining_time": "15:04:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 370, "total_steps": 3080, "loss": 0.3071, "learning_rate": 9.866139880908887e-06, "epoch": 0.24014278760343988, "percentage": 12.01, "elapsed_time": "2:03:25", "remaining_time": "15:03:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 372, "total_steps": 3080, "loss": 0.3239, "learning_rate": 9.863660892920514e-06, "epoch": 0.24144085672562063, "percentage": 12.08, "elapsed_time": "2:04:06", "remaining_time": "15:03:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 374, "total_steps": 3080, "loss": 0.3079, "learning_rate": 9.861159477775653e-06, "epoch": 0.2427389258478014, "percentage": 12.14, "elapsed_time": "2:04:49", "remaining_time": "15:03:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 376, "total_steps": 3080, "loss": 0.3124, "learning_rate": 9.858635647008747e-06, "epoch": 0.24403699496998216, "percentage": 12.21, "elapsed_time": "2:05:26", "remaining_time": "15:02:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 378, "total_steps": 3080, "loss": 0.3067, "learning_rate": 9.856089412257605e-06, "epoch": 0.2453350640921629, "percentage": 12.27, "elapsed_time": "2:06:06", "remaining_time": "15:01:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 380, "total_steps": 3080, "loss": 0.308, "learning_rate": 9.85352078526334e-06, "epoch": 0.24663313321434366, "percentage": 12.34, "elapsed_time": "2:06:48", "remaining_time": "15:01:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 382, "total_steps": 3080, "loss": 0.3277, "learning_rate": 9.850929777870324e-06, "epoch": 0.2479312023365244, "percentage": 12.4, "elapsed_time": "2:07:27", "remaining_time": "15:00:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 384, "total_steps": 3080, "loss": 0.2848, "learning_rate": 9.848316402026125e-06, "epoch": 0.2492292714587052, "percentage": 12.47, "elapsed_time": "2:08:09", "remaining_time": "14:59:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 386, "total_steps": 3080, "loss": 0.2932, "learning_rate": 9.845680669781459e-06, "epoch": 0.25052734058088594, "percentage": 12.53, "elapsed_time": "2:08:49", "remaining_time": "14:59:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 388, "total_steps": 3080, "loss": 0.3067, "learning_rate": 9.843022593290129e-06, "epoch": 0.2518254097030667, "percentage": 12.6, "elapsed_time": "2:09:26", "remaining_time": "14:58:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 390, "total_steps": 3080, "loss": 0.3132, "learning_rate": 9.840342184808973e-06, "epoch": 0.25312347882524744, "percentage": 12.66, "elapsed_time": "2:10:06", "remaining_time": "14:57:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 392, "total_steps": 3080, "loss": 0.2996, "learning_rate": 9.837639456697802e-06, "epoch": 0.2544215479474282, "percentage": 12.73, "elapsed_time": "2:10:46", "remaining_time": "14:56:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 394, "total_steps": 3080, "loss": 0.3138, "learning_rate": 9.83491442141935e-06, "epoch": 0.25571961706960894, "percentage": 12.79, "elapsed_time": "2:11:28", "remaining_time": "14:56:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 396, "total_steps": 3080, "loss": 0.3257, "learning_rate": 9.832167091539215e-06, "epoch": 0.2570176861917897, "percentage": 12.86, "elapsed_time": "2:12:14", "remaining_time": "14:56:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 398, "total_steps": 3080, "loss": 0.3049, "learning_rate": 9.829397479725791e-06, "epoch": 0.2583157553139705, "percentage": 12.92, "elapsed_time": "2:12:54", "remaining_time": "14:55:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 400, "total_steps": 3080, "loss": 0.3137, "learning_rate": 9.826605598750223e-06, "epoch": 0.2596138244361512, "percentage": 12.99, "elapsed_time": "2:13:34", "remaining_time": "14:54:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 402, "total_steps": 3080, "loss": 0.2843, "learning_rate": 9.823791461486348e-06, "epoch": 0.260911893558332, "percentage": 13.05, "elapsed_time": "2:14:13", "remaining_time": "14:54:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 404, "total_steps": 3080, "loss": 0.3454, "learning_rate": 9.82095508091062e-06, "epoch": 0.2622099626805127, "percentage": 13.12, "elapsed_time": "2:14:58", "remaining_time": "14:54:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 406, "total_steps": 3080, "loss": 0.2926, "learning_rate": 9.818096470102067e-06, "epoch": 0.2635080318026935, "percentage": 13.18, "elapsed_time": "2:15:44", "remaining_time": "14:53:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 408, "total_steps": 3080, "loss": 0.2728, "learning_rate": 9.815215642242224e-06, "epoch": 0.2648061009248743, "percentage": 13.25, "elapsed_time": "2:16:24", "remaining_time": "14:53:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 410, "total_steps": 3080, "loss": 0.3083, "learning_rate": 9.812312610615073e-06, "epoch": 0.266104170047055, "percentage": 13.31, "elapsed_time": "2:17:04", "remaining_time": "14:52:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 412, "total_steps": 3080, "loss": 0.2983, "learning_rate": 9.809387388606977e-06, "epoch": 0.2674022391692358, "percentage": 13.38, "elapsed_time": "2:17:47", "remaining_time": "14:52:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 414, "total_steps": 3080, "loss": 0.2997, "learning_rate": 9.806439989706626e-06, "epoch": 0.2687003082914165, "percentage": 13.44, "elapsed_time": "2:18:29", "remaining_time": "14:51:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 416, "total_steps": 3080, "loss": 0.3182, "learning_rate": 9.803470427504972e-06, "epoch": 0.2699983774135973, "percentage": 13.51, "elapsed_time": "2:19:09", "remaining_time": "14:51:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 418, "total_steps": 3080, "loss": 0.3269, "learning_rate": 9.800478715695165e-06, "epoch": 0.27129644653577806, "percentage": 13.57, "elapsed_time": "2:19:49", "remaining_time": "14:50:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 420, "total_steps": 3080, "loss": 0.3114, "learning_rate": 9.797464868072489e-06, "epoch": 0.2725945156579588, "percentage": 13.64, "elapsed_time": "2:20:25", "remaining_time": "14:49:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 422, "total_steps": 3080, "loss": 0.2928, "learning_rate": 9.794428898534301e-06, "epoch": 0.27389258478013956, "percentage": 13.7, "elapsed_time": "2:21:06", "remaining_time": "14:48:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 424, "total_steps": 3080, "loss": 0.3036, "learning_rate": 9.791370821079967e-06, "epoch": 0.2751906539023203, "percentage": 13.77, "elapsed_time": "2:21:49", "remaining_time": "14:48:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 426, "total_steps": 3080, "loss": 0.3128, "learning_rate": 9.788290649810794e-06, "epoch": 0.27648872302450106, "percentage": 13.83, "elapsed_time": "2:22:34", "remaining_time": "14:48:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 428, "total_steps": 3080, "loss": 0.3139, "learning_rate": 9.78518839892997e-06, "epoch": 0.27778679214668184, "percentage": 13.9, "elapsed_time": "2:23:13", "remaining_time": "14:47:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 430, "total_steps": 3080, "loss": 0.3229, "learning_rate": 9.782064082742494e-06, "epoch": 0.27908486126886256, "percentage": 13.96, "elapsed_time": "2:23:56", "remaining_time": "14:47:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 432, "total_steps": 3080, "loss": 0.3415, "learning_rate": 9.77891771565511e-06, "epoch": 0.28038293039104334, "percentage": 14.03, "elapsed_time": "2:24:39", "remaining_time": "14:46:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 434, "total_steps": 3080, "loss": 0.313, "learning_rate": 9.775749312176249e-06, "epoch": 0.28168099951322406, "percentage": 14.09, "elapsed_time": "2:25:20", "remaining_time": "14:46:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 436, "total_steps": 3080, "loss": 0.3003, "learning_rate": 9.772558886915946e-06, "epoch": 0.28297906863540484, "percentage": 14.16, "elapsed_time": "2:26:00", "remaining_time": "14:45:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 438, "total_steps": 3080, "loss": 0.3103, "learning_rate": 9.76934645458579e-06, "epoch": 0.2842771377575856, "percentage": 14.22, "elapsed_time": "2:26:38", "remaining_time": "14:44:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 440, "total_steps": 3080, "loss": 0.2946, "learning_rate": 9.766112029998847e-06, "epoch": 0.28557520687976634, "percentage": 14.29, "elapsed_time": "2:27:19", "remaining_time": "14:43:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 442, "total_steps": 3080, "loss": 0.3095, "learning_rate": 9.76285562806959e-06, "epoch": 0.2868732760019471, "percentage": 14.35, "elapsed_time": "2:28:00", "remaining_time": "14:43:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 444, "total_steps": 3080, "loss": 0.3245, "learning_rate": 9.759577263813833e-06, "epoch": 0.28817134512412784, "percentage": 14.42, "elapsed_time": "2:28:39", "remaining_time": "14:42:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 446, "total_steps": 3080, "loss": 0.2933, "learning_rate": 9.756276952348666e-06, "epoch": 0.2894694142463086, "percentage": 14.48, "elapsed_time": "2:29:21", "remaining_time": "14:42:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 448, "total_steps": 3080, "loss": 0.2951, "learning_rate": 9.752954708892379e-06, "epoch": 0.2907674833684894, "percentage": 14.55, "elapsed_time": "2:30:03", "remaining_time": "14:41:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 450, "total_steps": 3080, "loss": 0.2948, "learning_rate": 9.749610548764393e-06, "epoch": 0.2920655524906701, "percentage": 14.61, "elapsed_time": "2:30:42", "remaining_time": "14:40:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 452, "total_steps": 3080, "loss": 0.3307, "learning_rate": 9.74624448738519e-06, "epoch": 0.2933636216128509, "percentage": 14.68, "elapsed_time": "2:31:23", "remaining_time": "14:40:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 454, "total_steps": 3080, "loss": 0.3079, "learning_rate": 9.742856540276246e-06, "epoch": 0.2946616907350316, "percentage": 14.74, "elapsed_time": "2:32:01", "remaining_time": "14:39:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 456, "total_steps": 3080, "loss": 0.3372, "learning_rate": 9.739446723059953e-06, "epoch": 0.2959597598572124, "percentage": 14.81, "elapsed_time": "2:32:44", "remaining_time": "14:38:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 458, "total_steps": 3080, "loss": 0.3056, "learning_rate": 9.736015051459551e-06, "epoch": 0.2972578289793932, "percentage": 14.87, "elapsed_time": "2:33:23", "remaining_time": "14:38:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 460, "total_steps": 3080, "loss": 0.3298, "learning_rate": 9.732561541299053e-06, "epoch": 0.2985558981015739, "percentage": 14.94, "elapsed_time": "2:34:07", "remaining_time": "14:37:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 462, "total_steps": 3080, "loss": 0.3087, "learning_rate": 9.729086208503174e-06, "epoch": 0.2998539672237547, "percentage": 15.0, "elapsed_time": "2:34:49", "remaining_time": "14:37:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 464, "total_steps": 3080, "loss": 0.3101, "learning_rate": 9.725589069097257e-06, "epoch": 0.3011520363459354, "percentage": 15.06, "elapsed_time": "2:35:25", "remaining_time": "14:36:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 466, "total_steps": 3080, "loss": 0.3068, "learning_rate": 9.722070139207198e-06, "epoch": 0.3024501054681162, "percentage": 15.13, "elapsed_time": "2:36:05", "remaining_time": "14:35:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 468, "total_steps": 3080, "loss": 0.322, "learning_rate": 9.718529435059372e-06, "epoch": 0.30374817459029696, "percentage": 15.19, "elapsed_time": "2:36:46", "remaining_time": "14:34:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 470, "total_steps": 3080, "loss": 0.3124, "learning_rate": 9.714966972980563e-06, "epoch": 0.3050462437124777, "percentage": 15.26, "elapsed_time": "2:37:25", "remaining_time": "14:34:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 472, "total_steps": 3080, "loss": 0.3119, "learning_rate": 9.711382769397879e-06, "epoch": 0.30634431283465846, "percentage": 15.32, "elapsed_time": "2:38:15", "remaining_time": "14:34:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 474, "total_steps": 3080, "loss": 0.3262, "learning_rate": 9.707776840838685e-06, "epoch": 0.3076423819568392, "percentage": 15.39, "elapsed_time": "2:38:57", "remaining_time": "14:33:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 476, "total_steps": 3080, "loss": 0.3097, "learning_rate": 9.704149203930522e-06, "epoch": 0.30894045107901996, "percentage": 15.45, "elapsed_time": "2:39:34", "remaining_time": "14:32:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 478, "total_steps": 3080, "loss": 0.2844, "learning_rate": 9.700499875401035e-06, "epoch": 0.31023852020120074, "percentage": 15.52, "elapsed_time": "2:40:13", "remaining_time": "14:32:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 480, "total_steps": 3080, "loss": 0.2867, "learning_rate": 9.696828872077885e-06, "epoch": 0.31153658932338146, "percentage": 15.58, "elapsed_time": "2:40:50", "remaining_time": "14:31:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 482, "total_steps": 3080, "loss": 0.2807, "learning_rate": 9.69313621088869e-06, "epoch": 0.31283465844556224, "percentage": 15.65, "elapsed_time": "2:41:30", "remaining_time": "14:30:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 484, "total_steps": 3080, "loss": 0.3504, "learning_rate": 9.689421908860928e-06, "epoch": 0.31413272756774296, "percentage": 15.71, "elapsed_time": "2:42:16", "remaining_time": "14:30:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 486, "total_steps": 3080, "loss": 0.2959, "learning_rate": 9.685685983121867e-06, "epoch": 0.31543079668992374, "percentage": 15.78, "elapsed_time": "2:42:57", "remaining_time": "14:29:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 488, "total_steps": 3080, "loss": 0.3246, "learning_rate": 9.681928450898492e-06, "epoch": 0.3167288658121045, "percentage": 15.84, "elapsed_time": "2:43:40", "remaining_time": "14:29:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 490, "total_steps": 3080, "loss": 0.3034, "learning_rate": 9.67814932951741e-06, "epoch": 0.31802693493428524, "percentage": 15.91, "elapsed_time": "2:44:20", "remaining_time": "14:28:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 492, "total_steps": 3080, "loss": 0.2903, "learning_rate": 9.674348636404784e-06, "epoch": 0.319325004056466, "percentage": 15.97, "elapsed_time": "2:45:01", "remaining_time": "14:28:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 494, "total_steps": 3080, "loss": 0.2828, "learning_rate": 9.670526389086252e-06, "epoch": 0.32062307317864674, "percentage": 16.04, "elapsed_time": "2:45:39", "remaining_time": "14:27:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 496, "total_steps": 3080, "loss": 0.3153, "learning_rate": 9.666682605186834e-06, "epoch": 0.3219211423008275, "percentage": 16.1, "elapsed_time": "2:46:17", "remaining_time": "14:26:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 498, "total_steps": 3080, "loss": 0.3194, "learning_rate": 9.662817302430864e-06, "epoch": 0.3232192114230083, "percentage": 16.17, "elapsed_time": "2:46:56", "remaining_time": "14:25:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 3080, "loss": 0.3011, "learning_rate": 9.658930498641901e-06, "epoch": 0.324517280545189, "percentage": 16.23, "elapsed_time": "2:47:39", "remaining_time": "14:25:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 3080, "eval_loss": 0.30345335602760315, "epoch": 0.324517280545189, "percentage": 16.23, "elapsed_time": "3:01:28", "remaining_time": "15:36:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 502, "total_steps": 3080, "loss": 0.3092, "learning_rate": 9.655022211742651e-06, "epoch": 0.3258153496673698, "percentage": 16.3, "elapsed_time": "3:02:08", "remaining_time": "15:35:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 504, "total_steps": 3080, "loss": 0.2834, "learning_rate": 9.651092459754879e-06, "epoch": 0.3271134187895505, "percentage": 16.36, "elapsed_time": "3:02:50", "remaining_time": "15:34:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 506, "total_steps": 3080, "loss": 0.2841, "learning_rate": 9.64714126079933e-06, "epoch": 0.3284114879117313, "percentage": 16.43, "elapsed_time": "3:03:32", "remaining_time": "15:33:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 508, "total_steps": 3080, "loss": 0.3166, "learning_rate": 9.643168633095647e-06, "epoch": 0.3297095570339121, "percentage": 16.49, "elapsed_time": "3:04:11", "remaining_time": "15:32:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 510, "total_steps": 3080, "loss": 0.3026, "learning_rate": 9.639174594962283e-06, "epoch": 0.3310076261560928, "percentage": 16.56, "elapsed_time": "3:04:53", "remaining_time": "15:31:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 512, "total_steps": 3080, "loss": 0.3047, "learning_rate": 9.635159164816416e-06, "epoch": 0.3323056952782736, "percentage": 16.62, "elapsed_time": "3:05:37", "remaining_time": "15:31:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 514, "total_steps": 3080, "loss": 0.317, "learning_rate": 9.631122361173873e-06, "epoch": 0.3336037644004543, "percentage": 16.69, "elapsed_time": "3:06:16", "remaining_time": "15:29:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 516, "total_steps": 3080, "loss": 0.2818, "learning_rate": 9.627064202649027e-06, "epoch": 0.3349018335226351, "percentage": 16.75, "elapsed_time": "3:06:56", "remaining_time": "15:28:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 518, "total_steps": 3080, "loss": 0.3337, "learning_rate": 9.622984707954732e-06, "epoch": 0.33619990264481586, "percentage": 16.82, "elapsed_time": "3:07:37", "remaining_time": "15:27:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 520, "total_steps": 3080, "loss": 0.275, "learning_rate": 9.61888389590222e-06, "epoch": 0.3374979717669966, "percentage": 16.88, "elapsed_time": "3:08:16", "remaining_time": "15:26:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 522, "total_steps": 3080, "loss": 0.311, "learning_rate": 9.614761785401026e-06, "epoch": 0.33879604088917736, "percentage": 16.95, "elapsed_time": "3:08:58", "remaining_time": "15:26:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 524, "total_steps": 3080, "loss": 0.3133, "learning_rate": 9.610618395458892e-06, "epoch": 0.3400941100113581, "percentage": 17.01, "elapsed_time": "3:09:38", "remaining_time": "15:25:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 526, "total_steps": 3080, "loss": 0.2784, "learning_rate": 9.606453745181682e-06, "epoch": 0.34139217913353886, "percentage": 17.08, "elapsed_time": "3:10:17", "remaining_time": "15:23:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 528, "total_steps": 3080, "loss": 0.2976, "learning_rate": 9.602267853773301e-06, "epoch": 0.34269024825571964, "percentage": 17.14, "elapsed_time": "3:10:57", "remaining_time": "15:22:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 530, "total_steps": 3080, "loss": 0.3007, "learning_rate": 9.598060740535596e-06, "epoch": 0.34398831737790037, "percentage": 17.21, "elapsed_time": "3:11:39", "remaining_time": "15:22:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 532, "total_steps": 3080, "loss": 0.2957, "learning_rate": 9.593832424868271e-06, "epoch": 0.34528638650008114, "percentage": 17.27, "elapsed_time": "3:12:23", "remaining_time": "15:21:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 534, "total_steps": 3080, "loss": 0.2932, "learning_rate": 9.589582926268798e-06, "epoch": 0.34658445562226187, "percentage": 17.34, "elapsed_time": "3:13:05", "remaining_time": "15:20:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 536, "total_steps": 3080, "loss": 0.3114, "learning_rate": 9.585312264332329e-06, "epoch": 0.34788252474444264, "percentage": 17.4, "elapsed_time": "3:13:46", "remaining_time": "15:19:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 538, "total_steps": 3080, "loss": 0.2879, "learning_rate": 9.581020458751604e-06, "epoch": 0.3491805938666234, "percentage": 17.47, "elapsed_time": "3:14:31", "remaining_time": "15:19:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 540, "total_steps": 3080, "loss": 0.2984, "learning_rate": 9.576707529316857e-06, "epoch": 0.35047866298880415, "percentage": 17.53, "elapsed_time": "3:15:10", "remaining_time": "15:18:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 542, "total_steps": 3080, "loss": 0.3052, "learning_rate": 9.572373495915732e-06, "epoch": 0.3517767321109849, "percentage": 17.6, "elapsed_time": "3:15:50", "remaining_time": "15:17:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 544, "total_steps": 3080, "loss": 0.3217, "learning_rate": 9.568018378533181e-06, "epoch": 0.35307480123316565, "percentage": 17.66, "elapsed_time": "3:16:35", "remaining_time": "15:16:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 546, "total_steps": 3080, "loss": 0.2718, "learning_rate": 9.563642197251382e-06, "epoch": 0.3543728703553464, "percentage": 17.73, "elapsed_time": "3:17:14", "remaining_time": "15:15:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 548, "total_steps": 3080, "loss": 0.3133, "learning_rate": 9.559244972249643e-06, "epoch": 0.3556709394775272, "percentage": 17.79, "elapsed_time": "3:17:58", "remaining_time": "15:14:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 550, "total_steps": 3080, "loss": 0.318, "learning_rate": 9.554826723804304e-06, "epoch": 0.3569690085997079, "percentage": 17.86, "elapsed_time": "3:18:40", "remaining_time": "15:13:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 552, "total_steps": 3080, "loss": 0.2963, "learning_rate": 9.550387472288651e-06, "epoch": 0.3582670777218887, "percentage": 17.92, "elapsed_time": "3:19:22", "remaining_time": "15:13:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 554, "total_steps": 3080, "loss": 0.2904, "learning_rate": 9.545927238172817e-06, "epoch": 0.3595651468440694, "percentage": 17.99, "elapsed_time": "3:20:06", "remaining_time": "15:12:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 556, "total_steps": 3080, "loss": 0.2819, "learning_rate": 9.541446042023692e-06, "epoch": 0.3608632159662502, "percentage": 18.05, "elapsed_time": "3:20:46", "remaining_time": "15:11:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 558, "total_steps": 3080, "loss": 0.2898, "learning_rate": 9.53694390450482e-06, "epoch": 0.362161285088431, "percentage": 18.12, "elapsed_time": "3:21:22", "remaining_time": "15:10:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 560, "total_steps": 3080, "loss": 0.295, "learning_rate": 9.532420846376316e-06, "epoch": 0.3634593542106117, "percentage": 18.18, "elapsed_time": "3:22:00", "remaining_time": "15:09:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 562, "total_steps": 3080, "loss": 0.3276, "learning_rate": 9.527876888494758e-06, "epoch": 0.3647574233327925, "percentage": 18.25, "elapsed_time": "3:22:44", "remaining_time": "15:08:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 564, "total_steps": 3080, "loss": 0.2655, "learning_rate": 9.523312051813097e-06, "epoch": 0.3660554924549732, "percentage": 18.31, "elapsed_time": "3:23:22", "remaining_time": "15:07:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 566, "total_steps": 3080, "loss": 0.3245, "learning_rate": 9.518726357380565e-06, "epoch": 0.367353561577154, "percentage": 18.38, "elapsed_time": "3:24:04", "remaining_time": "15:06:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 568, "total_steps": 3080, "loss": 0.2729, "learning_rate": 9.514119826342564e-06, "epoch": 0.36865163069933476, "percentage": 18.44, "elapsed_time": "3:24:47", "remaining_time": "15:05:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 570, "total_steps": 3080, "loss": 0.3293, "learning_rate": 9.509492479940585e-06, "epoch": 0.3699496998215155, "percentage": 18.51, "elapsed_time": "3:25:30", "remaining_time": "15:04:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 572, "total_steps": 3080, "loss": 0.3424, "learning_rate": 9.504844339512096e-06, "epoch": 0.37124776894369627, "percentage": 18.57, "elapsed_time": "3:26:10", "remaining_time": "15:03:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 574, "total_steps": 3080, "loss": 0.2983, "learning_rate": 9.500175426490455e-06, "epoch": 0.372545838065877, "percentage": 18.64, "elapsed_time": "3:26:50", "remaining_time": "15:03:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 576, "total_steps": 3080, "loss": 0.3037, "learning_rate": 9.495485762404801e-06, "epoch": 0.37384390718805777, "percentage": 18.7, "elapsed_time": "3:27:32", "remaining_time": "15:02:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 578, "total_steps": 3080, "loss": 0.2927, "learning_rate": 9.490775368879966e-06, "epoch": 0.37514197631023855, "percentage": 18.77, "elapsed_time": "3:28:11", "remaining_time": "15:01:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 580, "total_steps": 3080, "loss": 0.2858, "learning_rate": 9.486044267636359e-06, "epoch": 0.37644004543241927, "percentage": 18.83, "elapsed_time": "3:28:51", "remaining_time": "15:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 582, "total_steps": 3080, "loss": 0.3147, "learning_rate": 9.481292480489885e-06, "epoch": 0.37773811455460005, "percentage": 18.9, "elapsed_time": "3:29:30", "remaining_time": "14:59:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 584, "total_steps": 3080, "loss": 0.298, "learning_rate": 9.476520029351834e-06, "epoch": 0.37903618367678077, "percentage": 18.96, "elapsed_time": "3:30:10", "remaining_time": "14:58:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 586, "total_steps": 3080, "loss": 0.3032, "learning_rate": 9.471726936228775e-06, "epoch": 0.38033425279896155, "percentage": 19.03, "elapsed_time": "3:30:49", "remaining_time": "14:57:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 588, "total_steps": 3080, "loss": 0.2836, "learning_rate": 9.466913223222467e-06, "epoch": 0.3816323219211423, "percentage": 19.09, "elapsed_time": "3:31:28", "remaining_time": "14:56:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 590, "total_steps": 3080, "loss": 0.2974, "learning_rate": 9.462078912529748e-06, "epoch": 0.38293039104332305, "percentage": 19.16, "elapsed_time": "3:32:07", "remaining_time": "14:55:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 592, "total_steps": 3080, "loss": 0.2758, "learning_rate": 9.457224026442435e-06, "epoch": 0.3842284601655038, "percentage": 19.22, "elapsed_time": "3:32:43", "remaining_time": "14:54:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 594, "total_steps": 3080, "loss": 0.2796, "learning_rate": 9.452348587347224e-06, "epoch": 0.38552652928768455, "percentage": 19.29, "elapsed_time": "3:33:21", "remaining_time": "14:52:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 596, "total_steps": 3080, "loss": 0.3012, "learning_rate": 9.447452617725581e-06, "epoch": 0.38682459840986533, "percentage": 19.35, "elapsed_time": "3:34:07", "remaining_time": "14:52:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 598, "total_steps": 3080, "loss": 0.3287, "learning_rate": 9.442536140153644e-06, "epoch": 0.3881226675320461, "percentage": 19.42, "elapsed_time": "3:34:50", "remaining_time": "14:51:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 600, "total_steps": 3080, "loss": 0.2834, "learning_rate": 9.437599177302115e-06, "epoch": 0.38942073665422683, "percentage": 19.48, "elapsed_time": "3:35:36", "remaining_time": "14:51:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 602, "total_steps": 3080, "loss": 0.3194, "learning_rate": 9.432641751936162e-06, "epoch": 0.3907188057764076, "percentage": 19.55, "elapsed_time": "3:36:14", "remaining_time": "14:50:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 604, "total_steps": 3080, "loss": 0.2817, "learning_rate": 9.427663886915302e-06, "epoch": 0.39201687489858833, "percentage": 19.61, "elapsed_time": "3:36:54", "remaining_time": "14:49:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 606, "total_steps": 3080, "loss": 0.2941, "learning_rate": 9.422665605193304e-06, "epoch": 0.3933149440207691, "percentage": 19.68, "elapsed_time": "3:37:33", "remaining_time": "14:48:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 608, "total_steps": 3080, "loss": 0.3345, "learning_rate": 9.417646929818089e-06, "epoch": 0.3946130131429499, "percentage": 19.74, "elapsed_time": "3:38:11", "remaining_time": "14:47:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 610, "total_steps": 3080, "loss": 0.2791, "learning_rate": 9.412607883931608e-06, "epoch": 0.3959110822651306, "percentage": 19.81, "elapsed_time": "3:38:50", "remaining_time": "14:46:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 612, "total_steps": 3080, "loss": 0.2994, "learning_rate": 9.407548490769747e-06, "epoch": 0.3972091513873114, "percentage": 19.87, "elapsed_time": "3:39:30", "remaining_time": "14:45:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 614, "total_steps": 3080, "loss": 0.297, "learning_rate": 9.402468773662217e-06, "epoch": 0.3985072205094921, "percentage": 19.94, "elapsed_time": "3:40:14", "remaining_time": "14:44:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 616, "total_steps": 3080, "loss": 0.2588, "learning_rate": 9.397368756032445e-06, "epoch": 0.3998052896316729, "percentage": 20.0, "elapsed_time": "3:40:55", "remaining_time": "14:43:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 618, "total_steps": 3080, "loss": 0.3246, "learning_rate": 9.392248461397474e-06, "epoch": 0.40110335875385367, "percentage": 20.06, "elapsed_time": "3:41:35", "remaining_time": "14:42:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 620, "total_steps": 3080, "loss": 0.287, "learning_rate": 9.387107913367832e-06, "epoch": 0.4024014278760344, "percentage": 20.13, "elapsed_time": "3:42:19", "remaining_time": "14:42:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 622, "total_steps": 3080, "loss": 0.2933, "learning_rate": 9.381947135647457e-06, "epoch": 0.40369949699821517, "percentage": 20.19, "elapsed_time": "3:42:56", "remaining_time": "14:41:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 624, "total_steps": 3080, "loss": 0.2952, "learning_rate": 9.376766152033556e-06, "epoch": 0.4049975661203959, "percentage": 20.26, "elapsed_time": "3:43:33", "remaining_time": "14:39:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 626, "total_steps": 3080, "loss": 0.2924, "learning_rate": 9.371564986416517e-06, "epoch": 0.40629563524257667, "percentage": 20.32, "elapsed_time": "3:44:12", "remaining_time": "14:38:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 628, "total_steps": 3080, "loss": 0.3222, "learning_rate": 9.366343662779784e-06, "epoch": 0.40759370436475745, "percentage": 20.39, "elapsed_time": "3:44:56", "remaining_time": "14:38:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 630, "total_steps": 3080, "loss": 0.2939, "learning_rate": 9.361102205199762e-06, "epoch": 0.40889177348693817, "percentage": 20.45, "elapsed_time": "3:45:35", "remaining_time": "14:37:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 632, "total_steps": 3080, "loss": 0.2995, "learning_rate": 9.355840637845683e-06, "epoch": 0.41018984260911895, "percentage": 20.52, "elapsed_time": "3:46:14", "remaining_time": "14:36:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 634, "total_steps": 3080, "loss": 0.2967, "learning_rate": 9.350558984979525e-06, "epoch": 0.41148791173129967, "percentage": 20.58, "elapsed_time": "3:46:54", "remaining_time": "14:35:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 636, "total_steps": 3080, "loss": 0.282, "learning_rate": 9.345257270955873e-06, "epoch": 0.41278598085348045, "percentage": 20.65, "elapsed_time": "3:47:35", "remaining_time": "14:34:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 638, "total_steps": 3080, "loss": 0.3083, "learning_rate": 9.339935520221816e-06, "epoch": 0.41408404997566123, "percentage": 20.71, "elapsed_time": "3:48:13", "remaining_time": "14:33:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 640, "total_steps": 3080, "loss": 0.2792, "learning_rate": 9.334593757316845e-06, "epoch": 0.41538211909784195, "percentage": 20.78, "elapsed_time": "3:48:52", "remaining_time": "14:32:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 642, "total_steps": 3080, "loss": 0.284, "learning_rate": 9.329232006872722e-06, "epoch": 0.41668018822002273, "percentage": 20.84, "elapsed_time": "3:49:36", "remaining_time": "14:31:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 644, "total_steps": 3080, "loss": 0.2859, "learning_rate": 9.32385029361338e-06, "epoch": 0.41797825734220345, "percentage": 20.91, "elapsed_time": "3:50:15", "remaining_time": "14:30:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 646, "total_steps": 3080, "loss": 0.2723, "learning_rate": 9.3184486423548e-06, "epoch": 0.41927632646438423, "percentage": 20.97, "elapsed_time": "3:50:58", "remaining_time": "14:30:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 648, "total_steps": 3080, "loss": 0.295, "learning_rate": 9.313027078004903e-06, "epoch": 0.420574395586565, "percentage": 21.04, "elapsed_time": "3:51:35", "remaining_time": "14:29:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 650, "total_steps": 3080, "loss": 0.2872, "learning_rate": 9.307585625563433e-06, "epoch": 0.42187246470874573, "percentage": 21.1, "elapsed_time": "3:52:17", "remaining_time": "14:28:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 652, "total_steps": 3080, "loss": 0.2861, "learning_rate": 9.302124310121841e-06, "epoch": 0.4231705338309265, "percentage": 21.17, "elapsed_time": "3:52:59", "remaining_time": "14:27:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 654, "total_steps": 3080, "loss": 0.3013, "learning_rate": 9.296643156863166e-06, "epoch": 0.42446860295310723, "percentage": 21.23, "elapsed_time": "3:53:41", "remaining_time": "14:26:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 656, "total_steps": 3080, "loss": 0.3177, "learning_rate": 9.291142191061927e-06, "epoch": 0.425766672075288, "percentage": 21.3, "elapsed_time": "3:54:25", "remaining_time": "14:26:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 658, "total_steps": 3080, "loss": 0.2829, "learning_rate": 9.285621438083997e-06, "epoch": 0.4270647411974688, "percentage": 21.36, "elapsed_time": "3:55:03", "remaining_time": "14:25:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 660, "total_steps": 3080, "loss": 0.2986, "learning_rate": 9.280080923386501e-06, "epoch": 0.4283628103196495, "percentage": 21.43, "elapsed_time": "3:55:44", "remaining_time": "14:24:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 662, "total_steps": 3080, "loss": 0.2947, "learning_rate": 9.274520672517677e-06, "epoch": 0.4296608794418303, "percentage": 21.49, "elapsed_time": "3:56:24", "remaining_time": "14:23:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 664, "total_steps": 3080, "loss": 0.2677, "learning_rate": 9.268940711116776e-06, "epoch": 0.430958948564011, "percentage": 21.56, "elapsed_time": "3:57:05", "remaining_time": "14:22:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 666, "total_steps": 3080, "loss": 0.3052, "learning_rate": 9.263341064913937e-06, "epoch": 0.4322570176861918, "percentage": 21.62, "elapsed_time": "3:57:44", "remaining_time": "14:21:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 668, "total_steps": 3080, "loss": 0.3171, "learning_rate": 9.25772175973007e-06, "epoch": 0.43355508680837257, "percentage": 21.69, "elapsed_time": "3:58:23", "remaining_time": "14:20:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 670, "total_steps": 3080, "loss": 0.305, "learning_rate": 9.252082821476728e-06, "epoch": 0.4348531559305533, "percentage": 21.75, "elapsed_time": "3:59:02", "remaining_time": "14:19:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 672, "total_steps": 3080, "loss": 0.3126, "learning_rate": 9.246424276156008e-06, "epoch": 0.43615122505273407, "percentage": 21.82, "elapsed_time": "3:59:43", "remaining_time": "14:18:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 674, "total_steps": 3080, "loss": 0.3076, "learning_rate": 9.240746149860408e-06, "epoch": 0.4374492941749148, "percentage": 21.88, "elapsed_time": "4:00:22", "remaining_time": "14:18:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 676, "total_steps": 3080, "loss": 0.3021, "learning_rate": 9.235048468772722e-06, "epoch": 0.43874736329709557, "percentage": 21.95, "elapsed_time": "4:01:04", "remaining_time": "14:17:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 678, "total_steps": 3080, "loss": 0.2747, "learning_rate": 9.229331259165915e-06, "epoch": 0.44004543241927635, "percentage": 22.01, "elapsed_time": "4:01:43", "remaining_time": "14:16:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 680, "total_steps": 3080, "loss": 0.3215, "learning_rate": 9.223594547402999e-06, "epoch": 0.4413435015414571, "percentage": 22.08, "elapsed_time": "4:02:27", "remaining_time": "14:15:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 682, "total_steps": 3080, "loss": 0.3159, "learning_rate": 9.217838359936914e-06, "epoch": 0.44264157066363785, "percentage": 22.14, "elapsed_time": "4:03:06", "remaining_time": "14:14:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 684, "total_steps": 3080, "loss": 0.3087, "learning_rate": 9.212062723310406e-06, "epoch": 0.4439396397858186, "percentage": 22.21, "elapsed_time": "4:03:45", "remaining_time": "14:13:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 686, "total_steps": 3080, "loss": 0.3177, "learning_rate": 9.206267664155906e-06, "epoch": 0.44523770890799935, "percentage": 22.27, "elapsed_time": "4:04:28", "remaining_time": "14:13:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 688, "total_steps": 3080, "loss": 0.2782, "learning_rate": 9.200453209195404e-06, "epoch": 0.44653577803018013, "percentage": 22.34, "elapsed_time": "4:05:13", "remaining_time": "14:12:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 690, "total_steps": 3080, "loss": 0.2784, "learning_rate": 9.194619385240327e-06, "epoch": 0.44783384715236085, "percentage": 22.4, "elapsed_time": "4:05:54", "remaining_time": "14:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 692, "total_steps": 3080, "loss": 0.2988, "learning_rate": 9.188766219191415e-06, "epoch": 0.44913191627454163, "percentage": 22.47, "elapsed_time": "4:06:35", "remaining_time": "14:10:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 694, "total_steps": 3080, "loss": 0.3265, "learning_rate": 9.1828937380386e-06, "epoch": 0.45042998539672235, "percentage": 22.53, "elapsed_time": "4:07:17", "remaining_time": "14:10:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 696, "total_steps": 3080, "loss": 0.3075, "learning_rate": 9.177001968860878e-06, "epoch": 0.45172805451890313, "percentage": 22.6, "elapsed_time": "4:07:57", "remaining_time": "14:09:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 698, "total_steps": 3080, "loss": 0.3307, "learning_rate": 9.171090938826184e-06, "epoch": 0.4530261236410839, "percentage": 22.66, "elapsed_time": "4:08:35", "remaining_time": "14:08:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 700, "total_steps": 3080, "loss": 0.2801, "learning_rate": 9.165160675191272e-06, "epoch": 0.45432419276326463, "percentage": 22.73, "elapsed_time": "4:09:15", "remaining_time": "14:07:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 702, "total_steps": 3080, "loss": 0.2961, "learning_rate": 9.159211205301581e-06, "epoch": 0.4556222618854454, "percentage": 22.79, "elapsed_time": "4:09:58", "remaining_time": "14:06:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 704, "total_steps": 3080, "loss": 0.3057, "learning_rate": 9.153242556591115e-06, "epoch": 0.45692033100762613, "percentage": 22.86, "elapsed_time": "4:10:39", "remaining_time": "14:05:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 706, "total_steps": 3080, "loss": 0.2584, "learning_rate": 9.147254756582316e-06, "epoch": 0.4582184001298069, "percentage": 22.92, "elapsed_time": "4:11:24", "remaining_time": "14:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 708, "total_steps": 3080, "loss": 0.2691, "learning_rate": 9.141247832885932e-06, "epoch": 0.4595164692519877, "percentage": 22.99, "elapsed_time": "4:12:03", "remaining_time": "14:04:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 710, "total_steps": 3080, "loss": 0.3022, "learning_rate": 9.135221813200899e-06, "epoch": 0.4608145383741684, "percentage": 23.05, "elapsed_time": "4:12:43", "remaining_time": "14:03:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 712, "total_steps": 3080, "loss": 0.2825, "learning_rate": 9.129176725314201e-06, "epoch": 0.4621126074963492, "percentage": 23.12, "elapsed_time": "4:13:21", "remaining_time": "14:02:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 714, "total_steps": 3080, "loss": 0.2914, "learning_rate": 9.123112597100759e-06, "epoch": 0.4634106766185299, "percentage": 23.18, "elapsed_time": "4:14:01", "remaining_time": "14:01:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 716, "total_steps": 3080, "loss": 0.3066, "learning_rate": 9.11702945652328e-06, "epoch": 0.4647087457407107, "percentage": 23.25, "elapsed_time": "4:14:43", "remaining_time": "14:00:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 718, "total_steps": 3080, "loss": 0.2905, "learning_rate": 9.110927331632147e-06, "epoch": 0.46600681486289147, "percentage": 23.31, "elapsed_time": "4:15:23", "remaining_time": "14:00:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 720, "total_steps": 3080, "loss": 0.2946, "learning_rate": 9.104806250565283e-06, "epoch": 0.4673048839850722, "percentage": 23.38, "elapsed_time": "4:16:06", "remaining_time": "13:59:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 722, "total_steps": 3080, "loss": 0.2728, "learning_rate": 9.09866624154802e-06, "epoch": 0.468602953107253, "percentage": 23.44, "elapsed_time": "4:16:42", "remaining_time": "13:58:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 724, "total_steps": 3080, "loss": 0.2841, "learning_rate": 9.092507332892968e-06, "epoch": 0.4699010222294337, "percentage": 23.51, "elapsed_time": "4:17:27", "remaining_time": "13:57:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 726, "total_steps": 3080, "loss": 0.3182, "learning_rate": 9.08632955299989e-06, "epoch": 0.4711990913516145, "percentage": 23.57, "elapsed_time": "4:18:09", "remaining_time": "13:57:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 728, "total_steps": 3080, "loss": 0.2837, "learning_rate": 9.080132930355567e-06, "epoch": 0.47249716047379525, "percentage": 23.64, "elapsed_time": "4:18:47", "remaining_time": "13:56:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 730, "total_steps": 3080, "loss": 0.3008, "learning_rate": 9.073917493533663e-06, "epoch": 0.473795229595976, "percentage": 23.7, "elapsed_time": "4:19:31", "remaining_time": "13:55:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 732, "total_steps": 3080, "loss": 0.3431, "learning_rate": 9.067683271194601e-06, "epoch": 0.47509329871815675, "percentage": 23.77, "elapsed_time": "4:20:15", "remaining_time": "13:54:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 734, "total_steps": 3080, "loss": 0.2805, "learning_rate": 9.061430292085427e-06, "epoch": 0.4763913678403375, "percentage": 23.83, "elapsed_time": "4:20:53", "remaining_time": "13:53:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 736, "total_steps": 3080, "loss": 0.2846, "learning_rate": 9.055158585039678e-06, "epoch": 0.47768943696251825, "percentage": 23.9, "elapsed_time": "4:21:34", "remaining_time": "13:53:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 738, "total_steps": 3080, "loss": 0.2999, "learning_rate": 9.048868178977243e-06, "epoch": 0.47898750608469903, "percentage": 23.96, "elapsed_time": "4:22:13", "remaining_time": "13:52:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 740, "total_steps": 3080, "loss": 0.2805, "learning_rate": 9.042559102904245e-06, "epoch": 0.48028557520687976, "percentage": 24.03, "elapsed_time": "4:22:49", "remaining_time": "13:51:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 742, "total_steps": 3080, "loss": 0.3026, "learning_rate": 9.03623138591289e-06, "epoch": 0.48158364432906053, "percentage": 24.09, "elapsed_time": "4:23:30", "remaining_time": "13:50:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 744, "total_steps": 3080, "loss": 0.3116, "learning_rate": 9.029885057181343e-06, "epoch": 0.48288171345124126, "percentage": 24.16, "elapsed_time": "4:24:09", "remaining_time": "13:49:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 746, "total_steps": 3080, "loss": 0.2937, "learning_rate": 9.02352014597359e-06, "epoch": 0.48417978257342204, "percentage": 24.22, "elapsed_time": "4:24:49", "remaining_time": "13:48:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 748, "total_steps": 3080, "loss": 0.3046, "learning_rate": 9.017136681639307e-06, "epoch": 0.4854778516956028, "percentage": 24.29, "elapsed_time": "4:25:28", "remaining_time": "13:47:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 750, "total_steps": 3080, "loss": 0.3044, "learning_rate": 9.010734693613716e-06, "epoch": 0.48677592081778354, "percentage": 24.35, "elapsed_time": "4:26:06", "remaining_time": "13:46:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 752, "total_steps": 3080, "loss": 0.2967, "learning_rate": 9.004314211417461e-06, "epoch": 0.4880739899399643, "percentage": 24.42, "elapsed_time": "4:26:50", "remaining_time": "13:46:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 754, "total_steps": 3080, "loss": 0.3033, "learning_rate": 8.997875264656461e-06, "epoch": 0.48937205906214504, "percentage": 24.48, "elapsed_time": "4:27:28", "remaining_time": "13:45:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 756, "total_steps": 3080, "loss": 0.2839, "learning_rate": 8.99141788302178e-06, "epoch": 0.4906701281843258, "percentage": 24.55, "elapsed_time": "4:28:07", "remaining_time": "13:44:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 758, "total_steps": 3080, "loss": 0.3279, "learning_rate": 8.984942096289488e-06, "epoch": 0.4919681973065066, "percentage": 24.61, "elapsed_time": "4:28:46", "remaining_time": "13:43:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 760, "total_steps": 3080, "loss": 0.3044, "learning_rate": 8.978447934320526e-06, "epoch": 0.4932662664286873, "percentage": 24.68, "elapsed_time": "4:29:27", "remaining_time": "13:42:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 762, "total_steps": 3080, "loss": 0.2866, "learning_rate": 8.971935427060563e-06, "epoch": 0.4945643355508681, "percentage": 24.74, "elapsed_time": "4:30:07", "remaining_time": "13:41:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 764, "total_steps": 3080, "loss": 0.2932, "learning_rate": 8.965404604539864e-06, "epoch": 0.4958624046730488, "percentage": 24.81, "elapsed_time": "4:30:46", "remaining_time": "13:40:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 766, "total_steps": 3080, "loss": 0.2916, "learning_rate": 8.958855496873146e-06, "epoch": 0.4971604737952296, "percentage": 24.87, "elapsed_time": "4:31:27", "remaining_time": "13:40:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 768, "total_steps": 3080, "loss": 0.2877, "learning_rate": 8.952288134259443e-06, "epoch": 0.4984585429174104, "percentage": 24.94, "elapsed_time": "4:32:03", "remaining_time": "13:38:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 770, "total_steps": 3080, "loss": 0.303, "learning_rate": 8.94570254698197e-06, "epoch": 0.4997566120395911, "percentage": 25.0, "elapsed_time": "4:32:43", "remaining_time": "13:38:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 772, "total_steps": 3080, "loss": 0.2766, "learning_rate": 8.93909876540797e-06, "epoch": 0.5010546811617719, "percentage": 25.06, "elapsed_time": "4:33:23", "remaining_time": "13:37:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 774, "total_steps": 3080, "loss": 0.284, "learning_rate": 8.932476819988589e-06, "epoch": 0.5023527502839527, "percentage": 25.13, "elapsed_time": "4:34:05", "remaining_time": "13:36:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 776, "total_steps": 3080, "loss": 0.2824, "learning_rate": 8.925836741258729e-06, "epoch": 0.5036508194061334, "percentage": 25.19, "elapsed_time": "4:34:46", "remaining_time": "13:35:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 778, "total_steps": 3080, "loss": 0.2844, "learning_rate": 8.91917855983691e-06, "epoch": 0.5049488885283141, "percentage": 25.26, "elapsed_time": "4:35:22", "remaining_time": "13:34:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 780, "total_steps": 3080, "loss": 0.289, "learning_rate": 8.912502306425121e-06, "epoch": 0.5062469576504949, "percentage": 25.32, "elapsed_time": "4:36:00", "remaining_time": "13:33:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 782, "total_steps": 3080, "loss": 0.2956, "learning_rate": 8.905808011808685e-06, "epoch": 0.5075450267726757, "percentage": 25.39, "elapsed_time": "4:36:38", "remaining_time": "13:32:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 784, "total_steps": 3080, "loss": 0.3098, "learning_rate": 8.899095706856122e-06, "epoch": 0.5088430958948564, "percentage": 25.45, "elapsed_time": "4:37:17", "remaining_time": "13:32:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 786, "total_steps": 3080, "loss": 0.2717, "learning_rate": 8.892365422518995e-06, "epoch": 0.5101411650170372, "percentage": 25.52, "elapsed_time": "4:37:55", "remaining_time": "13:31:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 788, "total_steps": 3080, "loss": 0.284, "learning_rate": 8.885617189831772e-06, "epoch": 0.5114392341392179, "percentage": 25.58, "elapsed_time": "4:38:35", "remaining_time": "13:30:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 790, "total_steps": 3080, "loss": 0.2807, "learning_rate": 8.87885103991169e-06, "epoch": 0.5127373032613987, "percentage": 25.65, "elapsed_time": "4:39:14", "remaining_time": "13:29:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 792, "total_steps": 3080, "loss": 0.3047, "learning_rate": 8.872067003958597e-06, "epoch": 0.5140353723835794, "percentage": 25.71, "elapsed_time": "4:39:55", "remaining_time": "13:28:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 794, "total_steps": 3080, "loss": 0.3228, "learning_rate": 8.865265113254826e-06, "epoch": 0.5153334415057602, "percentage": 25.78, "elapsed_time": "4:40:33", "remaining_time": "13:27:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 796, "total_steps": 3080, "loss": 0.286, "learning_rate": 8.858445399165033e-06, "epoch": 0.516631510627941, "percentage": 25.84, "elapsed_time": "4:41:13", "remaining_time": "13:26:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 798, "total_steps": 3080, "loss": 0.2698, "learning_rate": 8.851607893136065e-06, "epoch": 0.5179295797501217, "percentage": 25.91, "elapsed_time": "4:41:54", "remaining_time": "13:26:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 800, "total_steps": 3080, "loss": 0.2875, "learning_rate": 8.84475262669681e-06, "epoch": 0.5192276488723024, "percentage": 25.97, "elapsed_time": "4:42:33", "remaining_time": "13:25:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 802, "total_steps": 3080, "loss": 0.3084, "learning_rate": 8.837879631458053e-06, "epoch": 0.5205257179944832, "percentage": 26.04, "elapsed_time": "4:43:16", "remaining_time": "13:24:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 804, "total_steps": 3080, "loss": 0.2895, "learning_rate": 8.830988939112326e-06, "epoch": 0.521823787116664, "percentage": 26.1, "elapsed_time": "4:43:57", "remaining_time": "13:23:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 806, "total_steps": 3080, "loss": 0.2592, "learning_rate": 8.824080581433769e-06, "epoch": 0.5231218562388448, "percentage": 26.17, "elapsed_time": "4:44:38", "remaining_time": "13:23:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 808, "total_steps": 3080, "loss": 0.2771, "learning_rate": 8.817154590277976e-06, "epoch": 0.5244199253610254, "percentage": 26.23, "elapsed_time": "4:45:20", "remaining_time": "13:22:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 810, "total_steps": 3080, "loss": 0.2726, "learning_rate": 8.810210997581859e-06, "epoch": 0.5257179944832062, "percentage": 26.3, "elapsed_time": "4:46:02", "remaining_time": "13:21:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 812, "total_steps": 3080, "loss": 0.3111, "learning_rate": 8.803249835363486e-06, "epoch": 0.527016063605387, "percentage": 26.36, "elapsed_time": "4:46:42", "remaining_time": "13:20:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 814, "total_steps": 3080, "loss": 0.294, "learning_rate": 8.796271135721944e-06, "epoch": 0.5283141327275678, "percentage": 26.43, "elapsed_time": "4:47:25", "remaining_time": "13:20:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 816, "total_steps": 3080, "loss": 0.2836, "learning_rate": 8.789274930837189e-06, "epoch": 0.5296122018497486, "percentage": 26.49, "elapsed_time": "4:48:06", "remaining_time": "13:19:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 818, "total_steps": 3080, "loss": 0.2853, "learning_rate": 8.782261252969895e-06, "epoch": 0.5309102709719292, "percentage": 26.56, "elapsed_time": "4:48:45", "remaining_time": "13:18:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 820, "total_steps": 3080, "loss": 0.3105, "learning_rate": 8.775230134461307e-06, "epoch": 0.53220834009411, "percentage": 26.62, "elapsed_time": "4:49:28", "remaining_time": "13:17:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 822, "total_steps": 3080, "loss": 0.2888, "learning_rate": 8.768181607733095e-06, "epoch": 0.5335064092162908, "percentage": 26.69, "elapsed_time": "4:50:07", "remaining_time": "13:16:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 824, "total_steps": 3080, "loss": 0.2872, "learning_rate": 8.761115705287195e-06, "epoch": 0.5348044783384716, "percentage": 26.75, "elapsed_time": "4:50:53", "remaining_time": "13:16:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 826, "total_steps": 3080, "loss": 0.2748, "learning_rate": 8.754032459705672e-06, "epoch": 0.5361025474606523, "percentage": 26.82, "elapsed_time": "4:51:34", "remaining_time": "13:15:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 828, "total_steps": 3080, "loss": 0.275, "learning_rate": 8.746931903650558e-06, "epoch": 0.537400616582833, "percentage": 26.88, "elapsed_time": "4:52:16", "remaining_time": "13:14:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 830, "total_steps": 3080, "loss": 0.2818, "learning_rate": 8.739814069863708e-06, "epoch": 0.5386986857050138, "percentage": 26.95, "elapsed_time": "4:52:57", "remaining_time": "13:14:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 832, "total_steps": 3080, "loss": 0.2827, "learning_rate": 8.732678991166647e-06, "epoch": 0.5399967548271946, "percentage": 27.01, "elapsed_time": "4:53:36", "remaining_time": "13:13:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 834, "total_steps": 3080, "loss": 0.2972, "learning_rate": 8.725526700460426e-06, "epoch": 0.5412948239493753, "percentage": 27.08, "elapsed_time": "4:54:19", "remaining_time": "13:12:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 836, "total_steps": 3080, "loss": 0.2896, "learning_rate": 8.71835723072545e-06, "epoch": 0.5425928930715561, "percentage": 27.14, "elapsed_time": "4:54:56", "remaining_time": "13:11:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 838, "total_steps": 3080, "loss": 0.3427, "learning_rate": 8.71117061502135e-06, "epoch": 0.5438909621937368, "percentage": 27.21, "elapsed_time": "4:55:36", "remaining_time": "13:10:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 840, "total_steps": 3080, "loss": 0.2943, "learning_rate": 8.703966886486819e-06, "epoch": 0.5451890313159176, "percentage": 27.27, "elapsed_time": "4:56:15", "remaining_time": "13:10:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 842, "total_steps": 3080, "loss": 0.2923, "learning_rate": 8.696746078339455e-06, "epoch": 0.5464871004380983, "percentage": 27.34, "elapsed_time": "4:56:54", "remaining_time": "13:09:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 844, "total_steps": 3080, "loss": 0.2812, "learning_rate": 8.68950822387562e-06, "epoch": 0.5477851695602791, "percentage": 27.4, "elapsed_time": "4:57:30", "remaining_time": "13:08:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 846, "total_steps": 3080, "loss": 0.2878, "learning_rate": 8.68225335647027e-06, "epoch": 0.5490832386824599, "percentage": 27.47, "elapsed_time": "4:58:12", "remaining_time": "13:07:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 848, "total_steps": 3080, "loss": 0.3083, "learning_rate": 8.674981509576819e-06, "epoch": 0.5503813078046406, "percentage": 27.53, "elapsed_time": "4:58:50", "remaining_time": "13:06:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 850, "total_steps": 3080, "loss": 0.2929, "learning_rate": 8.667692716726974e-06, "epoch": 0.5516793769268213, "percentage": 27.6, "elapsed_time": "4:59:28", "remaining_time": "13:05:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 852, "total_steps": 3080, "loss": 0.292, "learning_rate": 8.66038701153058e-06, "epoch": 0.5529774460490021, "percentage": 27.66, "elapsed_time": "5:00:10", "remaining_time": "13:04:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 854, "total_steps": 3080, "loss": 0.3135, "learning_rate": 8.65306442767547e-06, "epoch": 0.5542755151711829, "percentage": 27.73, "elapsed_time": "5:00:51", "remaining_time": "13:04:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 856, "total_steps": 3080, "loss": 0.3071, "learning_rate": 8.64572499892731e-06, "epoch": 0.5555735842933637, "percentage": 27.79, "elapsed_time": "5:01:33", "remaining_time": "13:03:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 858, "total_steps": 3080, "loss": 0.2722, "learning_rate": 8.638368759129433e-06, "epoch": 0.5568716534155443, "percentage": 27.86, "elapsed_time": "5:02:11", "remaining_time": "13:02:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 860, "total_steps": 3080, "loss": 0.2919, "learning_rate": 8.630995742202695e-06, "epoch": 0.5581697225377251, "percentage": 27.92, "elapsed_time": "5:02:52", "remaining_time": "13:01:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 862, "total_steps": 3080, "loss": 0.27, "learning_rate": 8.623605982145318e-06, "epoch": 0.5594677916599059, "percentage": 27.99, "elapsed_time": "5:03:35", "remaining_time": "13:01:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 864, "total_steps": 3080, "loss": 0.2926, "learning_rate": 8.616199513032723e-06, "epoch": 0.5607658607820867, "percentage": 28.05, "elapsed_time": "5:04:15", "remaining_time": "13:00:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 866, "total_steps": 3080, "loss": 0.2993, "learning_rate": 8.608776369017382e-06, "epoch": 0.5620639299042675, "percentage": 28.12, "elapsed_time": "5:04:56", "remaining_time": "12:59:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 868, "total_steps": 3080, "loss": 0.2817, "learning_rate": 8.601336584328659e-06, "epoch": 0.5633619990264481, "percentage": 28.18, "elapsed_time": "5:05:37", "remaining_time": "12:58:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 870, "total_steps": 3080, "loss": 0.3029, "learning_rate": 8.593880193272649e-06, "epoch": 0.5646600681486289, "percentage": 28.25, "elapsed_time": "5:06:19", "remaining_time": "12:58:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 872, "total_steps": 3080, "loss": 0.3101, "learning_rate": 8.58640723023202e-06, "epoch": 0.5659581372708097, "percentage": 28.31, "elapsed_time": "5:06:59", "remaining_time": "12:57:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 874, "total_steps": 3080, "loss": 0.2947, "learning_rate": 8.578917729665863e-06, "epoch": 0.5672562063929905, "percentage": 28.38, "elapsed_time": "5:07:39", "remaining_time": "12:56:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 876, "total_steps": 3080, "loss": 0.2869, "learning_rate": 8.571411726109518e-06, "epoch": 0.5685542755151712, "percentage": 28.44, "elapsed_time": "5:08:18", "remaining_time": "12:55:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 878, "total_steps": 3080, "loss": 0.3198, "learning_rate": 8.563889254174429e-06, "epoch": 0.5698523446373519, "percentage": 28.51, "elapsed_time": "5:09:01", "remaining_time": "12:55:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 880, "total_steps": 3080, "loss": 0.3014, "learning_rate": 8.556350348547978e-06, "epoch": 0.5711504137595327, "percentage": 28.57, "elapsed_time": "5:09:40", "remaining_time": "12:54:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 882, "total_steps": 3080, "loss": 0.302, "learning_rate": 8.548795043993316e-06, "epoch": 0.5724484828817135, "percentage": 28.64, "elapsed_time": "5:10:18", "remaining_time": "12:53:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 884, "total_steps": 3080, "loss": 0.2879, "learning_rate": 8.54122337534923e-06, "epoch": 0.5737465520038942, "percentage": 28.7, "elapsed_time": "5:10:59", "remaining_time": "12:52:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 886, "total_steps": 3080, "loss": 0.2969, "learning_rate": 8.533635377529949e-06, "epoch": 0.575044621126075, "percentage": 28.77, "elapsed_time": "5:11:41", "remaining_time": "12:51:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 888, "total_steps": 3080, "loss": 0.3158, "learning_rate": 8.526031085525004e-06, "epoch": 0.5763426902482557, "percentage": 28.83, "elapsed_time": "5:12:18", "remaining_time": "12:50:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 890, "total_steps": 3080, "loss": 0.2846, "learning_rate": 8.518410534399063e-06, "epoch": 0.5776407593704365, "percentage": 28.9, "elapsed_time": "5:12:58", "remaining_time": "12:50:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 892, "total_steps": 3080, "loss": 0.2806, "learning_rate": 8.510773759291768e-06, "epoch": 0.5789388284926172, "percentage": 28.96, "elapsed_time": "5:13:36", "remaining_time": "12:49:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 894, "total_steps": 3080, "loss": 0.2829, "learning_rate": 8.503120795417568e-06, "epoch": 0.580236897614798, "percentage": 29.03, "elapsed_time": "5:14:15", "remaining_time": "12:48:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 896, "total_steps": 3080, "loss": 0.3033, "learning_rate": 8.495451678065563e-06, "epoch": 0.5815349667369788, "percentage": 29.09, "elapsed_time": "5:15:01", "remaining_time": "12:47:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 898, "total_steps": 3080, "loss": 0.2656, "learning_rate": 8.487766442599339e-06, "epoch": 0.5828330358591595, "percentage": 29.16, "elapsed_time": "5:15:44", "remaining_time": "12:47:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 900, "total_steps": 3080, "loss": 0.2883, "learning_rate": 8.48006512445681e-06, "epoch": 0.5841311049813402, "percentage": 29.22, "elapsed_time": "5:16:25", "remaining_time": "12:46:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 902, "total_steps": 3080, "loss": 0.269, "learning_rate": 8.472347759150044e-06, "epoch": 0.585429174103521, "percentage": 29.29, "elapsed_time": "5:17:04", "remaining_time": "12:45:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 904, "total_steps": 3080, "loss": 0.3032, "learning_rate": 8.464614382265107e-06, "epoch": 0.5867272432257018, "percentage": 29.35, "elapsed_time": "5:17:47", "remaining_time": "12:44:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 906, "total_steps": 3080, "loss": 0.303, "learning_rate": 8.4568650294619e-06, "epoch": 0.5880253123478826, "percentage": 29.42, "elapsed_time": "5:18:24", "remaining_time": "12:44:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 908, "total_steps": 3080, "loss": 0.3056, "learning_rate": 8.449099736473986e-06, "epoch": 0.5893233814700632, "percentage": 29.48, "elapsed_time": "5:19:01", "remaining_time": "12:43:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 910, "total_steps": 3080, "loss": 0.3327, "learning_rate": 8.441318539108433e-06, "epoch": 0.590621450592244, "percentage": 29.55, "elapsed_time": "5:19:42", "remaining_time": "12:42:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 912, "total_steps": 3080, "loss": 0.2803, "learning_rate": 8.433521473245653e-06, "epoch": 0.5919195197144248, "percentage": 29.61, "elapsed_time": "5:20:23", "remaining_time": "12:41:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 914, "total_steps": 3080, "loss": 0.306, "learning_rate": 8.425708574839221e-06, "epoch": 0.5932175888366056, "percentage": 29.68, "elapsed_time": "5:21:02", "remaining_time": "12:40:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 916, "total_steps": 3080, "loss": 0.2743, "learning_rate": 8.417879879915724e-06, "epoch": 0.5945156579587864, "percentage": 29.74, "elapsed_time": "5:21:38", "remaining_time": "12:39:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 918, "total_steps": 3080, "loss": 0.3026, "learning_rate": 8.410035424574587e-06, "epoch": 0.595813727080967, "percentage": 29.81, "elapsed_time": "5:22:16", "remaining_time": "12:39:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 920, "total_steps": 3080, "loss": 0.3008, "learning_rate": 8.40217524498791e-06, "epoch": 0.5971117962031478, "percentage": 29.87, "elapsed_time": "5:22:56", "remaining_time": "12:38:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 922, "total_steps": 3080, "loss": 0.295, "learning_rate": 8.394299377400301e-06, "epoch": 0.5984098653253286, "percentage": 29.94, "elapsed_time": "5:23:39", "remaining_time": "12:37:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 924, "total_steps": 3080, "loss": 0.277, "learning_rate": 8.386407858128707e-06, "epoch": 0.5997079344475094, "percentage": 30.0, "elapsed_time": "5:24:17", "remaining_time": "12:36:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 926, "total_steps": 3080, "loss": 0.3059, "learning_rate": 8.378500723562243e-06, "epoch": 0.6010060035696901, "percentage": 30.06, "elapsed_time": "5:24:58", "remaining_time": "12:35:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 928, "total_steps": 3080, "loss": 0.2849, "learning_rate": 8.370578010162043e-06, "epoch": 0.6023040726918708, "percentage": 30.13, "elapsed_time": "5:25:38", "remaining_time": "12:35:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 930, "total_steps": 3080, "loss": 0.2743, "learning_rate": 8.362639754461057e-06, "epoch": 0.6036021418140516, "percentage": 30.19, "elapsed_time": "5:26:19", "remaining_time": "12:34:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 932, "total_steps": 3080, "loss": 0.3138, "learning_rate": 8.354685993063923e-06, "epoch": 0.6049002109362324, "percentage": 30.26, "elapsed_time": "5:27:02", "remaining_time": "12:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 934, "total_steps": 3080, "loss": 0.2959, "learning_rate": 8.346716762646763e-06, "epoch": 0.6061982800584131, "percentage": 30.32, "elapsed_time": "5:27:38", "remaining_time": "12:32:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 936, "total_steps": 3080, "loss": 0.2785, "learning_rate": 8.338732099957038e-06, "epoch": 0.6074963491805939, "percentage": 30.39, "elapsed_time": "5:28:20", "remaining_time": "12:32:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 938, "total_steps": 3080, "loss": 0.2939, "learning_rate": 8.330732041813367e-06, "epoch": 0.6087944183027746, "percentage": 30.45, "elapsed_time": "5:28:57", "remaining_time": "12:31:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 940, "total_steps": 3080, "loss": 0.2649, "learning_rate": 8.322716625105363e-06, "epoch": 0.6100924874249554, "percentage": 30.52, "elapsed_time": "5:29:34", "remaining_time": "12:30:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 942, "total_steps": 3080, "loss": 0.2782, "learning_rate": 8.314685886793456e-06, "epoch": 0.6113905565471361, "percentage": 30.58, "elapsed_time": "5:30:10", "remaining_time": "12:29:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 944, "total_steps": 3080, "loss": 0.2938, "learning_rate": 8.306639863908725e-06, "epoch": 0.6126886256693169, "percentage": 30.65, "elapsed_time": "5:30:51", "remaining_time": "12:28:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 946, "total_steps": 3080, "loss": 0.2734, "learning_rate": 8.298578593552737e-06, "epoch": 0.6139866947914977, "percentage": 30.71, "elapsed_time": "5:31:31", "remaining_time": "12:27:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 948, "total_steps": 3080, "loss": 0.3051, "learning_rate": 8.290502112897357e-06, "epoch": 0.6152847639136784, "percentage": 30.78, "elapsed_time": "5:32:17", "remaining_time": "12:27:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 950, "total_steps": 3080, "loss": 0.2907, "learning_rate": 8.282410459184597e-06, "epoch": 0.6165828330358591, "percentage": 30.84, "elapsed_time": "5:32:58", "remaining_time": "12:26:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 952, "total_steps": 3080, "loss": 0.2764, "learning_rate": 8.274303669726427e-06, "epoch": 0.6178809021580399, "percentage": 30.91, "elapsed_time": "5:33:36", "remaining_time": "12:25:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 954, "total_steps": 3080, "loss": 0.3078, "learning_rate": 8.266181781904613e-06, "epoch": 0.6191789712802207, "percentage": 30.97, "elapsed_time": "5:34:17", "remaining_time": "12:24:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 956, "total_steps": 3080, "loss": 0.2884, "learning_rate": 8.258044833170545e-06, "epoch": 0.6204770404024015, "percentage": 31.04, "elapsed_time": "5:34:57", "remaining_time": "12:24:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 958, "total_steps": 3080, "loss": 0.32, "learning_rate": 8.24989286104506e-06, "epoch": 0.6217751095245821, "percentage": 31.1, "elapsed_time": "5:35:36", "remaining_time": "12:23:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 960, "total_steps": 3080, "loss": 0.2941, "learning_rate": 8.241725903118264e-06, "epoch": 0.6230731786467629, "percentage": 31.17, "elapsed_time": "5:36:15", "remaining_time": "12:22:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 962, "total_steps": 3080, "loss": 0.2909, "learning_rate": 8.233543997049376e-06, "epoch": 0.6243712477689437, "percentage": 31.23, "elapsed_time": "5:36:59", "remaining_time": "12:21:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 964, "total_steps": 3080, "loss": 0.2879, "learning_rate": 8.225347180566534e-06, "epoch": 0.6256693168911245, "percentage": 31.3, "elapsed_time": "5:37:42", "remaining_time": "12:21:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 966, "total_steps": 3080, "loss": 0.2916, "learning_rate": 8.217135491466636e-06, "epoch": 0.6269673860133053, "percentage": 31.36, "elapsed_time": "5:38:20", "remaining_time": "12:20:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 968, "total_steps": 3080, "loss": 0.2712, "learning_rate": 8.208908967615159e-06, "epoch": 0.6282654551354859, "percentage": 31.43, "elapsed_time": "5:39:01", "remaining_time": "12:19:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 970, "total_steps": 3080, "loss": 0.289, "learning_rate": 8.200667646945983e-06, "epoch": 0.6295635242576667, "percentage": 31.49, "elapsed_time": "5:39:45", "remaining_time": "12:19:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 972, "total_steps": 3080, "loss": 0.3077, "learning_rate": 8.192411567461222e-06, "epoch": 0.6308615933798475, "percentage": 31.56, "elapsed_time": "5:40:34", "remaining_time": "12:18:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 974, "total_steps": 3080, "loss": 0.2742, "learning_rate": 8.184140767231044e-06, "epoch": 0.6321596625020283, "percentage": 31.62, "elapsed_time": "5:41:13", "remaining_time": "12:17:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 976, "total_steps": 3080, "loss": 0.266, "learning_rate": 8.175855284393495e-06, "epoch": 0.633457731624209, "percentage": 31.69, "elapsed_time": "5:41:53", "remaining_time": "12:17:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 978, "total_steps": 3080, "loss": 0.2756, "learning_rate": 8.167555157154327e-06, "epoch": 0.6347558007463897, "percentage": 31.75, "elapsed_time": "5:42:30", "remaining_time": "12:16:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 980, "total_steps": 3080, "loss": 0.289, "learning_rate": 8.15924042378682e-06, "epoch": 0.6360538698685705, "percentage": 31.82, "elapsed_time": "5:43:08", "remaining_time": "12:15:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 982, "total_steps": 3080, "loss": 0.302, "learning_rate": 8.150911122631606e-06, "epoch": 0.6373519389907513, "percentage": 31.88, "elapsed_time": "5:43:48", "remaining_time": "12:14:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 984, "total_steps": 3080, "loss": 0.2831, "learning_rate": 8.142567292096488e-06, "epoch": 0.638650008112932, "percentage": 31.95, "elapsed_time": "5:44:36", "remaining_time": "12:14:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 986, "total_steps": 3080, "loss": 0.2893, "learning_rate": 8.13420897065627e-06, "epoch": 0.6399480772351128, "percentage": 32.01, "elapsed_time": "5:45:21", "remaining_time": "12:13:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 988, "total_steps": 3080, "loss": 0.3004, "learning_rate": 8.125836196852577e-06, "epoch": 0.6412461463572935, "percentage": 32.08, "elapsed_time": "5:46:10", "remaining_time": "12:12:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 990, "total_steps": 3080, "loss": 0.3045, "learning_rate": 8.117449009293668e-06, "epoch": 0.6425442154794743, "percentage": 32.14, "elapsed_time": "5:46:51", "remaining_time": "12:12:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 992, "total_steps": 3080, "loss": 0.2833, "learning_rate": 8.109047446654276e-06, "epoch": 0.643842284601655, "percentage": 32.21, "elapsed_time": "5:47:31", "remaining_time": "12:11:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 994, "total_steps": 3080, "loss": 0.269, "learning_rate": 8.100631547675417e-06, "epoch": 0.6451403537238358, "percentage": 32.27, "elapsed_time": "5:48:12", "remaining_time": "12:10:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 996, "total_steps": 3080, "loss": 0.3091, "learning_rate": 8.092201351164213e-06, "epoch": 0.6464384228460166, "percentage": 32.34, "elapsed_time": "5:48:57", "remaining_time": "12:10:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 998, "total_steps": 3080, "loss": 0.2857, "learning_rate": 8.083756895993712e-06, "epoch": 0.6477364919681973, "percentage": 32.4, "elapsed_time": "5:49:38", "remaining_time": "12:09:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 3080, "loss": 0.3026, "learning_rate": 8.075298221102714e-06, "epoch": 0.649034561090378, "percentage": 32.47, "elapsed_time": "5:50:17", "remaining_time": "12:08:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 3080, "eval_loss": 0.29006972908973694, "epoch": 0.649034561090378, "percentage": 32.47, "elapsed_time": "6:04:06", "remaining_time": "12:37:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1002, "total_steps": 3080, "loss": 0.2813, "learning_rate": 8.066825365495591e-06, "epoch": 0.6503326302125588, "percentage": 32.53, "elapsed_time": "6:04:48", "remaining_time": "12:36:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1004, "total_steps": 3080, "loss": 0.2702, "learning_rate": 8.058338368242103e-06, "epoch": 0.6516306993347396, "percentage": 32.6, "elapsed_time": "6:05:28", "remaining_time": "12:35:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1006, "total_steps": 3080, "loss": 0.297, "learning_rate": 8.049837268477213e-06, "epoch": 0.6529287684569204, "percentage": 32.66, "elapsed_time": "6:06:04", "remaining_time": "12:34:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1008, "total_steps": 3080, "loss": 0.305, "learning_rate": 8.041322105400923e-06, "epoch": 0.654226837579101, "percentage": 32.73, "elapsed_time": "6:06:40", "remaining_time": "12:33:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1010, "total_steps": 3080, "loss": 0.2955, "learning_rate": 8.032792918278076e-06, "epoch": 0.6555249067012818, "percentage": 32.79, "elapsed_time": "6:07:18", "remaining_time": "12:32:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1012, "total_steps": 3080, "loss": 0.303, "learning_rate": 8.024249746438189e-06, "epoch": 0.6568229758234626, "percentage": 32.86, "elapsed_time": "6:07:55", "remaining_time": "12:31:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1014, "total_steps": 3080, "loss": 0.2898, "learning_rate": 8.015692629275256e-06, "epoch": 0.6581210449456434, "percentage": 32.92, "elapsed_time": "6:08:39", "remaining_time": "12:31:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1016, "total_steps": 3080, "loss": 0.2811, "learning_rate": 8.007121606247583e-06, "epoch": 0.6594191140678242, "percentage": 32.99, "elapsed_time": "6:09:18", "remaining_time": "12:30:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1018, "total_steps": 3080, "loss": 0.2968, "learning_rate": 7.998536716877593e-06, "epoch": 0.6607171831900048, "percentage": 33.05, "elapsed_time": "6:09:56", "remaining_time": "12:29:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1020, "total_steps": 3080, "loss": 0.3056, "learning_rate": 7.989938000751655e-06, "epoch": 0.6620152523121856, "percentage": 33.12, "elapsed_time": "6:10:37", "remaining_time": "12:28:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1022, "total_steps": 3080, "loss": 0.2927, "learning_rate": 7.981325497519892e-06, "epoch": 0.6633133214343664, "percentage": 33.18, "elapsed_time": "6:11:16", "remaining_time": "12:27:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1024, "total_steps": 3080, "loss": 0.2725, "learning_rate": 7.972699246895996e-06, "epoch": 0.6646113905565472, "percentage": 33.25, "elapsed_time": "6:11:54", "remaining_time": "12:26:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1026, "total_steps": 3080, "loss": 0.2711, "learning_rate": 7.964059288657061e-06, "epoch": 0.6659094596787279, "percentage": 33.31, "elapsed_time": "6:12:35", "remaining_time": "12:25:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1028, "total_steps": 3080, "loss": 0.3139, "learning_rate": 7.955405662643384e-06, "epoch": 0.6672075288009086, "percentage": 33.38, "elapsed_time": "6:13:15", "remaining_time": "12:25:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1030, "total_steps": 3080, "loss": 0.2636, "learning_rate": 7.946738408758283e-06, "epoch": 0.6685055979230894, "percentage": 33.44, "elapsed_time": "6:13:59", "remaining_time": "12:24:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1032, "total_steps": 3080, "loss": 0.3031, "learning_rate": 7.938057566967926e-06, "epoch": 0.6698036670452702, "percentage": 33.51, "elapsed_time": "6:14:40", "remaining_time": "12:23:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1034, "total_steps": 3080, "loss": 0.2623, "learning_rate": 7.929363177301124e-06, "epoch": 0.671101736167451, "percentage": 33.57, "elapsed_time": "6:15:18", "remaining_time": "12:22:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1036, "total_steps": 3080, "loss": 0.2624, "learning_rate": 7.920655279849173e-06, "epoch": 0.6723998052896317, "percentage": 33.64, "elapsed_time": "6:15:59", "remaining_time": "12:21:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1038, "total_steps": 3080, "loss": 0.2634, "learning_rate": 7.911933914765645e-06, "epoch": 0.6736978744118124, "percentage": 33.7, "elapsed_time": "6:16:40", "remaining_time": "12:21:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1040, "total_steps": 3080, "loss": 0.2734, "learning_rate": 7.90319912226622e-06, "epoch": 0.6749959435339932, "percentage": 33.77, "elapsed_time": "6:17:18", "remaining_time": "12:20:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1042, "total_steps": 3080, "loss": 0.3134, "learning_rate": 7.894450942628491e-06, "epoch": 0.676294012656174, "percentage": 33.83, "elapsed_time": "6:18:01", "remaining_time": "12:19:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1044, "total_steps": 3080, "loss": 0.3776, "learning_rate": 7.885689416191785e-06, "epoch": 0.6775920817783547, "percentage": 33.9, "elapsed_time": "6:18:44", "remaining_time": "12:18:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1046, "total_steps": 3080, "loss": 0.2825, "learning_rate": 7.876914583356965e-06, "epoch": 0.6788901509005355, "percentage": 33.96, "elapsed_time": "6:19:25", "remaining_time": "12:17:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1048, "total_steps": 3080, "loss": 0.2897, "learning_rate": 7.868126484586261e-06, "epoch": 0.6801882200227162, "percentage": 34.03, "elapsed_time": "6:20:05", "remaining_time": "12:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1050, "total_steps": 3080, "loss": 0.304, "learning_rate": 7.859325160403073e-06, "epoch": 0.681486289144897, "percentage": 34.09, "elapsed_time": "6:20:44", "remaining_time": "12:16:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1052, "total_steps": 3080, "loss": 0.3055, "learning_rate": 7.850510651391778e-06, "epoch": 0.6827843582670777, "percentage": 34.16, "elapsed_time": "6:21:24", "remaining_time": "12:15:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1054, "total_steps": 3080, "loss": 0.2995, "learning_rate": 7.841682998197561e-06, "epoch": 0.6840824273892585, "percentage": 34.22, "elapsed_time": "6:22:06", "remaining_time": "12:14:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1056, "total_steps": 3080, "loss": 0.2953, "learning_rate": 7.832842241526212e-06, "epoch": 0.6853804965114393, "percentage": 34.29, "elapsed_time": "6:22:46", "remaining_time": "12:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1058, "total_steps": 3080, "loss": 0.2902, "learning_rate": 7.823988422143942e-06, "epoch": 0.68667856563362, "percentage": 34.35, "elapsed_time": "6:23:24", "remaining_time": "12:12:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1060, "total_steps": 3080, "loss": 0.312, "learning_rate": 7.815121580877197e-06, "epoch": 0.6879766347558007, "percentage": 34.42, "elapsed_time": "6:24:01", "remaining_time": "12:11:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1062, "total_steps": 3080, "loss": 0.2721, "learning_rate": 7.806241758612471e-06, "epoch": 0.6892747038779815, "percentage": 34.48, "elapsed_time": "6:24:43", "remaining_time": "12:11:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1064, "total_steps": 3080, "loss": 0.3408, "learning_rate": 7.797348996296116e-06, "epoch": 0.6905727730001623, "percentage": 34.55, "elapsed_time": "6:25:28", "remaining_time": "12:10:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1066, "total_steps": 3080, "loss": 0.3036, "learning_rate": 7.788443334934148e-06, "epoch": 0.6918708421223431, "percentage": 34.61, "elapsed_time": "6:26:09", "remaining_time": "12:09:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1068, "total_steps": 3080, "loss": 0.2832, "learning_rate": 7.779524815592068e-06, "epoch": 0.6931689112445237, "percentage": 34.68, "elapsed_time": "6:26:48", "remaining_time": "12:08:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1070, "total_steps": 3080, "loss": 0.2845, "learning_rate": 7.770593479394664e-06, "epoch": 0.6944669803667045, "percentage": 34.74, "elapsed_time": "6:27:32", "remaining_time": "12:07:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1072, "total_steps": 3080, "loss": 0.2725, "learning_rate": 7.761649367525828e-06, "epoch": 0.6957650494888853, "percentage": 34.81, "elapsed_time": "6:28:16", "remaining_time": "12:07:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1074, "total_steps": 3080, "loss": 0.2757, "learning_rate": 7.752692521228357e-06, "epoch": 0.6970631186110661, "percentage": 34.87, "elapsed_time": "6:29:00", "remaining_time": "12:06:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1076, "total_steps": 3080, "loss": 0.2983, "learning_rate": 7.743722981803777e-06, "epoch": 0.6983611877332468, "percentage": 34.94, "elapsed_time": "6:29:37", "remaining_time": "12:05:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1078, "total_steps": 3080, "loss": 0.2903, "learning_rate": 7.734740790612137e-06, "epoch": 0.6996592568554275, "percentage": 35.0, "elapsed_time": "6:30:15", "remaining_time": "12:04:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1080, "total_steps": 3080, "loss": 0.265, "learning_rate": 7.725745989071825e-06, "epoch": 0.7009573259776083, "percentage": 35.06, "elapsed_time": "6:30:59", "remaining_time": "12:04:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1082, "total_steps": 3080, "loss": 0.3073, "learning_rate": 7.716738618659382e-06, "epoch": 0.7022553950997891, "percentage": 35.13, "elapsed_time": "6:31:44", "remaining_time": "12:03:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1084, "total_steps": 3080, "loss": 0.3093, "learning_rate": 7.707718720909308e-06, "epoch": 0.7035534642219698, "percentage": 35.19, "elapsed_time": "6:32:24", "remaining_time": "12:02:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1086, "total_steps": 3080, "loss": 0.2929, "learning_rate": 7.698686337413862e-06, "epoch": 0.7048515333441506, "percentage": 35.26, "elapsed_time": "6:33:06", "remaining_time": "12:01:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1088, "total_steps": 3080, "loss": 0.2523, "learning_rate": 7.689641509822879e-06, "epoch": 0.7061496024663313, "percentage": 35.32, "elapsed_time": "6:33:46", "remaining_time": "12:00:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1090, "total_steps": 3080, "loss": 0.2905, "learning_rate": 7.680584279843579e-06, "epoch": 0.7074476715885121, "percentage": 35.39, "elapsed_time": "6:34:29", "remaining_time": "12:00:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1092, "total_steps": 3080, "loss": 0.2932, "learning_rate": 7.671514689240366e-06, "epoch": 0.7087457407106929, "percentage": 35.45, "elapsed_time": "6:35:11", "remaining_time": "11:59:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1094, "total_steps": 3080, "loss": 0.2846, "learning_rate": 7.662432779834648e-06, "epoch": 0.7100438098328736, "percentage": 35.52, "elapsed_time": "6:35:50", "remaining_time": "11:58:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1096, "total_steps": 3080, "loss": 0.2658, "learning_rate": 7.653338593504632e-06, "epoch": 0.7113418789550544, "percentage": 35.58, "elapsed_time": "6:36:29", "remaining_time": "11:57:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1098, "total_steps": 3080, "loss": 0.3104, "learning_rate": 7.644232172185133e-06, "epoch": 0.7126399480772351, "percentage": 35.65, "elapsed_time": "6:37:05", "remaining_time": "11:56:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1100, "total_steps": 3080, "loss": 0.2621, "learning_rate": 7.635113557867395e-06, "epoch": 0.7139380171994159, "percentage": 35.71, "elapsed_time": "6:37:44", "remaining_time": "11:55:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1102, "total_steps": 3080, "loss": 0.3384, "learning_rate": 7.625982792598874e-06, "epoch": 0.7152360863215966, "percentage": 35.78, "elapsed_time": "6:38:28", "remaining_time": "11:55:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1104, "total_steps": 3080, "loss": 0.2787, "learning_rate": 7.616839918483061e-06, "epoch": 0.7165341554437774, "percentage": 35.84, "elapsed_time": "6:39:06", "remaining_time": "11:54:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1106, "total_steps": 3080, "loss": 0.2877, "learning_rate": 7.607684977679284e-06, "epoch": 0.7178322245659582, "percentage": 35.91, "elapsed_time": "6:39:50", "remaining_time": "11:53:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1108, "total_steps": 3080, "loss": 0.2774, "learning_rate": 7.598518012402509e-06, "epoch": 0.7191302936881389, "percentage": 35.97, "elapsed_time": "6:40:31", "remaining_time": "11:52:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1110, "total_steps": 3080, "loss": 0.2635, "learning_rate": 7.5893390649231555e-06, "epoch": 0.7204283628103196, "percentage": 36.04, "elapsed_time": "6:41:14", "remaining_time": "11:52:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1112, "total_steps": 3080, "loss": 0.2878, "learning_rate": 7.580148177566886e-06, "epoch": 0.7217264319325004, "percentage": 36.1, "elapsed_time": "6:41:52", "remaining_time": "11:51:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1114, "total_steps": 3080, "loss": 0.3085, "learning_rate": 7.5709453927144275e-06, "epoch": 0.7230245010546812, "percentage": 36.17, "elapsed_time": "6:42:33", "remaining_time": "11:50:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1116, "total_steps": 3080, "loss": 0.2655, "learning_rate": 7.561730752801364e-06, "epoch": 0.724322570176862, "percentage": 36.23, "elapsed_time": "6:43:12", "remaining_time": "11:49:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1118, "total_steps": 3080, "loss": 0.3159, "learning_rate": 7.552504300317944e-06, "epoch": 0.7256206392990426, "percentage": 36.3, "elapsed_time": "6:43:51", "remaining_time": "11:48:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1120, "total_steps": 3080, "loss": 0.2947, "learning_rate": 7.543266077808893e-06, "epoch": 0.7269187084212234, "percentage": 36.36, "elapsed_time": "6:44:30", "remaining_time": "11:47:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1122, "total_steps": 3080, "loss": 0.2815, "learning_rate": 7.5340161278732e-06, "epoch": 0.7282167775434042, "percentage": 36.43, "elapsed_time": "6:45:09", "remaining_time": "11:47:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1124, "total_steps": 3080, "loss": 0.2753, "learning_rate": 7.524754493163939e-06, "epoch": 0.729514846665585, "percentage": 36.49, "elapsed_time": "6:45:49", "remaining_time": "11:46:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1126, "total_steps": 3080, "loss": 0.2803, "learning_rate": 7.515481216388063e-06, "epoch": 0.7308129157877657, "percentage": 36.56, "elapsed_time": "6:46:34", "remaining_time": "11:45:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1128, "total_steps": 3080, "loss": 0.3105, "learning_rate": 7.506196340306204e-06, "epoch": 0.7321109849099464, "percentage": 36.62, "elapsed_time": "6:47:17", "remaining_time": "11:44:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1130, "total_steps": 3080, "loss": 0.2957, "learning_rate": 7.496899907732485e-06, "epoch": 0.7334090540321272, "percentage": 36.69, "elapsed_time": "6:47:55", "remaining_time": "11:43:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1132, "total_steps": 3080, "loss": 0.3114, "learning_rate": 7.487591961534319e-06, "epoch": 0.734707123154308, "percentage": 36.75, "elapsed_time": "6:48:33", "remaining_time": "11:43:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1134, "total_steps": 3080, "loss": 0.3076, "learning_rate": 7.478272544632204e-06, "epoch": 0.7360051922764888, "percentage": 36.82, "elapsed_time": "6:49:13", "remaining_time": "11:42:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1136, "total_steps": 3080, "loss": 0.2903, "learning_rate": 7.468941699999535e-06, "epoch": 0.7373032613986695, "percentage": 36.88, "elapsed_time": "6:49:53", "remaining_time": "11:41:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1138, "total_steps": 3080, "loss": 0.2498, "learning_rate": 7.4595994706624065e-06, "epoch": 0.7386013305208502, "percentage": 36.95, "elapsed_time": "6:50:36", "remaining_time": "11:40:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1140, "total_steps": 3080, "loss": 0.2836, "learning_rate": 7.450245899699401e-06, "epoch": 0.739899399643031, "percentage": 37.01, "elapsed_time": "6:51:15", "remaining_time": "11:39:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1142, "total_steps": 3080, "loss": 0.2799, "learning_rate": 7.440881030241407e-06, "epoch": 0.7411974687652118, "percentage": 37.08, "elapsed_time": "6:51:56", "remaining_time": "11:39:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1144, "total_steps": 3080, "loss": 0.2966, "learning_rate": 7.431504905471407e-06, "epoch": 0.7424955378873925, "percentage": 37.14, "elapsed_time": "6:52:39", "remaining_time": "11:38:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1146, "total_steps": 3080, "loss": 0.3034, "learning_rate": 7.422117568624288e-06, "epoch": 0.7437936070095733, "percentage": 37.21, "elapsed_time": "6:53:16", "remaining_time": "11:37:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1148, "total_steps": 3080, "loss": 0.2795, "learning_rate": 7.412719062986632e-06, "epoch": 0.745091676131754, "percentage": 37.27, "elapsed_time": "6:53:59", "remaining_time": "11:36:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1150, "total_steps": 3080, "loss": 0.2872, "learning_rate": 7.403309431896528e-06, "epoch": 0.7463897452539348, "percentage": 37.34, "elapsed_time": "6:54:37", "remaining_time": "11:35:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1152, "total_steps": 3080, "loss": 0.2747, "learning_rate": 7.393888718743362e-06, "epoch": 0.7476878143761155, "percentage": 37.4, "elapsed_time": "6:55:14", "remaining_time": "11:34:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1154, "total_steps": 3080, "loss": 0.2707, "learning_rate": 7.384456966967624e-06, "epoch": 0.7489858834982963, "percentage": 37.47, "elapsed_time": "6:55:58", "remaining_time": "11:34:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1156, "total_steps": 3080, "loss": 0.2773, "learning_rate": 7.375014220060705e-06, "epoch": 0.7502839526204771, "percentage": 37.53, "elapsed_time": "6:56:38", "remaining_time": "11:33:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1158, "total_steps": 3080, "loss": 0.2758, "learning_rate": 7.365560521564696e-06, "epoch": 0.7515820217426578, "percentage": 37.6, "elapsed_time": "6:57:18", "remaining_time": "11:32:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1160, "total_steps": 3080, "loss": 0.2951, "learning_rate": 7.3560959150721844e-06, "epoch": 0.7528800908648385, "percentage": 37.66, "elapsed_time": "6:58:00", "remaining_time": "11:31:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1162, "total_steps": 3080, "loss": 0.3057, "learning_rate": 7.3466204442260605e-06, "epoch": 0.7541781599870193, "percentage": 37.73, "elapsed_time": "6:58:40", "remaining_time": "11:31:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1164, "total_steps": 3080, "loss": 0.3171, "learning_rate": 7.337134152719312e-06, "epoch": 0.7554762291092001, "percentage": 37.79, "elapsed_time": "6:59:19", "remaining_time": "11:30:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1166, "total_steps": 3080, "loss": 0.2789, "learning_rate": 7.327637084294818e-06, "epoch": 0.7567742982313809, "percentage": 37.86, "elapsed_time": "6:59:59", "remaining_time": "11:29:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1168, "total_steps": 3080, "loss": 0.2784, "learning_rate": 7.318129282745152e-06, "epoch": 0.7580723673535615, "percentage": 37.92, "elapsed_time": "7:00:39", "remaining_time": "11:28:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1170, "total_steps": 3080, "loss": 0.3189, "learning_rate": 7.30861079191239e-06, "epoch": 0.7593704364757423, "percentage": 37.99, "elapsed_time": "7:01:26", "remaining_time": "11:27:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1172, "total_steps": 3080, "loss": 0.2832, "learning_rate": 7.299081655687885e-06, "epoch": 0.7606685055979231, "percentage": 38.05, "elapsed_time": "7:02:07", "remaining_time": "11:27:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1174, "total_steps": 3080, "loss": 0.2758, "learning_rate": 7.2895419180120855e-06, "epoch": 0.7619665747201039, "percentage": 38.12, "elapsed_time": "7:02:47", "remaining_time": "11:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1176, "total_steps": 3080, "loss": 0.261, "learning_rate": 7.279991622874319e-06, "epoch": 0.7632646438422847, "percentage": 38.18, "elapsed_time": "7:03:26", "remaining_time": "11:25:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1178, "total_steps": 3080, "loss": 0.3018, "learning_rate": 7.2704308143126035e-06, "epoch": 0.7645627129644653, "percentage": 38.25, "elapsed_time": "7:04:02", "remaining_time": "11:24:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1180, "total_steps": 3080, "loss": 0.2817, "learning_rate": 7.260859536413429e-06, "epoch": 0.7658607820866461, "percentage": 38.31, "elapsed_time": "7:04:41", "remaining_time": "11:23:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1182, "total_steps": 3080, "loss": 0.2765, "learning_rate": 7.251277833311565e-06, "epoch": 0.7671588512088269, "percentage": 38.38, "elapsed_time": "7:05:20", "remaining_time": "11:22:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1184, "total_steps": 3080, "loss": 0.2902, "learning_rate": 7.241685749189851e-06, "epoch": 0.7684569203310077, "percentage": 38.44, "elapsed_time": "7:06:06", "remaining_time": "11:22:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1186, "total_steps": 3080, "loss": 0.3157, "learning_rate": 7.2320833282789985e-06, "epoch": 0.7697549894531884, "percentage": 38.51, "elapsed_time": "7:06:47", "remaining_time": "11:21:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1188, "total_steps": 3080, "loss": 0.2672, "learning_rate": 7.22247061485738e-06, "epoch": 0.7710530585753691, "percentage": 38.57, "elapsed_time": "7:07:27", "remaining_time": "11:20:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1190, "total_steps": 3080, "loss": 0.2896, "learning_rate": 7.212847653250828e-06, "epoch": 0.7723511276975499, "percentage": 38.64, "elapsed_time": "7:08:04", "remaining_time": "11:19:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1192, "total_steps": 3080, "loss": 0.2868, "learning_rate": 7.203214487832437e-06, "epoch": 0.7736491968197307, "percentage": 38.7, "elapsed_time": "7:08:45", "remaining_time": "11:19:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1194, "total_steps": 3080, "loss": 0.2774, "learning_rate": 7.193571163022348e-06, "epoch": 0.7749472659419114, "percentage": 38.77, "elapsed_time": "7:09:23", "remaining_time": "11:18:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1196, "total_steps": 3080, "loss": 0.2881, "learning_rate": 7.18391772328755e-06, "epoch": 0.7762453350640922, "percentage": 38.83, "elapsed_time": "7:09:59", "remaining_time": "11:17:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1198, "total_steps": 3080, "loss": 0.29, "learning_rate": 7.174254213141671e-06, "epoch": 0.7775434041862729, "percentage": 38.9, "elapsed_time": "7:10:40", "remaining_time": "11:16:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1200, "total_steps": 3080, "loss": 0.3319, "learning_rate": 7.164580677144781e-06, "epoch": 0.7788414733084537, "percentage": 38.96, "elapsed_time": "7:11:22", "remaining_time": "11:15:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1202, "total_steps": 3080, "loss": 0.2775, "learning_rate": 7.154897159903178e-06, "epoch": 0.7801395424306344, "percentage": 39.03, "elapsed_time": "7:12:02", "remaining_time": "11:15:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1204, "total_steps": 3080, "loss": 0.2708, "learning_rate": 7.145203706069183e-06, "epoch": 0.7814376115528152, "percentage": 39.09, "elapsed_time": "7:12:37", "remaining_time": "11:14:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1206, "total_steps": 3080, "loss": 0.2911, "learning_rate": 7.135500360340937e-06, "epoch": 0.782735680674996, "percentage": 39.16, "elapsed_time": "7:13:17", "remaining_time": "11:13:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1208, "total_steps": 3080, "loss": 0.29, "learning_rate": 7.125787167462197e-06, "epoch": 0.7840337497971767, "percentage": 39.22, "elapsed_time": "7:13:59", "remaining_time": "11:12:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1210, "total_steps": 3080, "loss": 0.275, "learning_rate": 7.1160641722221255e-06, "epoch": 0.7853318189193574, "percentage": 39.29, "elapsed_time": "7:14:41", "remaining_time": "11:11:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1212, "total_steps": 3080, "loss": 0.2888, "learning_rate": 7.106331419455085e-06, "epoch": 0.7866298880415382, "percentage": 39.35, "elapsed_time": "7:15:20", "remaining_time": "11:10:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1214, "total_steps": 3080, "loss": 0.2862, "learning_rate": 7.09658895404043e-06, "epoch": 0.787927957163719, "percentage": 39.42, "elapsed_time": "7:16:01", "remaining_time": "11:10:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1216, "total_steps": 3080, "loss": 0.266, "learning_rate": 7.086836820902305e-06, "epoch": 0.7892260262858998, "percentage": 39.48, "elapsed_time": "7:16:39", "remaining_time": "11:09:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1218, "total_steps": 3080, "loss": 0.275, "learning_rate": 7.0770750650094335e-06, "epoch": 0.7905240954080804, "percentage": 39.55, "elapsed_time": "7:17:19", "remaining_time": "11:08:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1220, "total_steps": 3080, "loss": 0.2837, "learning_rate": 7.067303731374907e-06, "epoch": 0.7918221645302612, "percentage": 39.61, "elapsed_time": "7:18:03", "remaining_time": "11:07:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1222, "total_steps": 3080, "loss": 0.306, "learning_rate": 7.057522865055985e-06, "epoch": 0.793120233652442, "percentage": 39.68, "elapsed_time": "7:18:43", "remaining_time": "11:07:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1224, "total_steps": 3080, "loss": 0.3098, "learning_rate": 7.047732511153885e-06, "epoch": 0.7944183027746228, "percentage": 39.74, "elapsed_time": "7:19:20", "remaining_time": "11:06:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1226, "total_steps": 3080, "loss": 0.2586, "learning_rate": 7.037932714813572e-06, "epoch": 0.7957163718968036, "percentage": 39.81, "elapsed_time": "7:20:00", "remaining_time": "11:05:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1228, "total_steps": 3080, "loss": 0.2803, "learning_rate": 7.028123521223548e-06, "epoch": 0.7970144410189842, "percentage": 39.87, "elapsed_time": "7:20:39", "remaining_time": "11:04:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1230, "total_steps": 3080, "loss": 0.298, "learning_rate": 7.018304975615653e-06, "epoch": 0.798312510141165, "percentage": 39.94, "elapsed_time": "7:21:19", "remaining_time": "11:03:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1232, "total_steps": 3080, "loss": 0.2967, "learning_rate": 7.008477123264849e-06, "epoch": 0.7996105792633458, "percentage": 40.0, "elapsed_time": "7:22:00", "remaining_time": "11:03:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1234, "total_steps": 3080, "loss": 0.2749, "learning_rate": 6.998640009489009e-06, "epoch": 0.8009086483855266, "percentage": 40.06, "elapsed_time": "7:22:39", "remaining_time": "11:02:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1236, "total_steps": 3080, "loss": 0.2981, "learning_rate": 6.98879367964872e-06, "epoch": 0.8022067175077073, "percentage": 40.13, "elapsed_time": "7:23:22", "remaining_time": "11:01:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1238, "total_steps": 3080, "loss": 0.3354, "learning_rate": 6.9789381791470575e-06, "epoch": 0.803504786629888, "percentage": 40.19, "elapsed_time": "7:24:01", "remaining_time": "11:00:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1240, "total_steps": 3080, "loss": 0.2865, "learning_rate": 6.969073553429388e-06, "epoch": 0.8048028557520688, "percentage": 40.26, "elapsed_time": "7:24:42", "remaining_time": "10:59:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1242, "total_steps": 3080, "loss": 0.3201, "learning_rate": 6.95919984798316e-06, "epoch": 0.8061009248742496, "percentage": 40.32, "elapsed_time": "7:25:22", "remaining_time": "10:59:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1244, "total_steps": 3080, "loss": 0.263, "learning_rate": 6.949317108337681e-06, "epoch": 0.8073989939964303, "percentage": 40.39, "elapsed_time": "7:26:03", "remaining_time": "10:58:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1246, "total_steps": 3080, "loss": 0.2917, "learning_rate": 6.939425380063924e-06, "epoch": 0.8086970631186111, "percentage": 40.45, "elapsed_time": "7:26:44", "remaining_time": "10:57:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1248, "total_steps": 3080, "loss": 0.2569, "learning_rate": 6.92952470877431e-06, "epoch": 0.8099951322407918, "percentage": 40.52, "elapsed_time": "7:27:23", "remaining_time": "10:56:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1250, "total_steps": 3080, "loss": 0.2654, "learning_rate": 6.919615140122492e-06, "epoch": 0.8112932013629726, "percentage": 40.58, "elapsed_time": "7:28:03", "remaining_time": "10:55:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1252, "total_steps": 3080, "loss": 0.2873, "learning_rate": 6.909696719803156e-06, "epoch": 0.8125912704851533, "percentage": 40.65, "elapsed_time": "7:28:44", "remaining_time": "10:55:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1254, "total_steps": 3080, "loss": 0.2817, "learning_rate": 6.8997694935518e-06, "epoch": 0.8138893396073341, "percentage": 40.71, "elapsed_time": "7:29:27", "remaining_time": "10:54:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1256, "total_steps": 3080, "loss": 0.2734, "learning_rate": 6.889833507144534e-06, "epoch": 0.8151874087295149, "percentage": 40.78, "elapsed_time": "7:30:05", "remaining_time": "10:53:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1258, "total_steps": 3080, "loss": 0.2815, "learning_rate": 6.879888806397855e-06, "epoch": 0.8164854778516956, "percentage": 40.84, "elapsed_time": "7:30:42", "remaining_time": "10:52:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1260, "total_steps": 3080, "loss": 0.2949, "learning_rate": 6.869935437168449e-06, "epoch": 0.8177835469738763, "percentage": 40.91, "elapsed_time": "7:31:19", "remaining_time": "10:51:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1262, "total_steps": 3080, "loss": 0.2536, "learning_rate": 6.85997344535297e-06, "epoch": 0.8190816160960571, "percentage": 40.97, "elapsed_time": "7:32:01", "remaining_time": "10:51:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1264, "total_steps": 3080, "loss": 0.259, "learning_rate": 6.850002876887836e-06, "epoch": 0.8203796852182379, "percentage": 41.04, "elapsed_time": "7:32:40", "remaining_time": "10:50:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1266, "total_steps": 3080, "loss": 0.2846, "learning_rate": 6.840023777749008e-06, "epoch": 0.8216777543404187, "percentage": 41.1, "elapsed_time": "7:33:20", "remaining_time": "10:49:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1268, "total_steps": 3080, "loss": 0.3429, "learning_rate": 6.83003619395179e-06, "epoch": 0.8229758234625993, "percentage": 41.17, "elapsed_time": "7:34:01", "remaining_time": "10:48:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1270, "total_steps": 3080, "loss": 0.2811, "learning_rate": 6.8200401715506045e-06, "epoch": 0.8242738925847801, "percentage": 41.23, "elapsed_time": "7:34:43", "remaining_time": "10:48:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1272, "total_steps": 3080, "loss": 0.275, "learning_rate": 6.81003575663879e-06, "epoch": 0.8255719617069609, "percentage": 41.3, "elapsed_time": "7:35:25", "remaining_time": "10:47:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1274, "total_steps": 3080, "loss": 0.2965, "learning_rate": 6.800022995348381e-06, "epoch": 0.8268700308291417, "percentage": 41.36, "elapsed_time": "7:36:06", "remaining_time": "10:46:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1276, "total_steps": 3080, "loss": 0.2738, "learning_rate": 6.7900019338499005e-06, "epoch": 0.8281680999513225, "percentage": 41.43, "elapsed_time": "7:36:46", "remaining_time": "10:45:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1278, "total_steps": 3080, "loss": 0.2727, "learning_rate": 6.779972618352143e-06, "epoch": 0.8294661690735031, "percentage": 41.49, "elapsed_time": "7:37:27", "remaining_time": "10:45:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1280, "total_steps": 3080, "loss": 0.257, "learning_rate": 6.7699350951019685e-06, "epoch": 0.8307642381956839, "percentage": 41.56, "elapsed_time": "7:38:10", "remaining_time": "10:44:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1282, "total_steps": 3080, "loss": 0.2994, "learning_rate": 6.759889410384078e-06, "epoch": 0.8320623073178647, "percentage": 41.62, "elapsed_time": "7:38:48", "remaining_time": "10:43:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1284, "total_steps": 3080, "loss": 0.2651, "learning_rate": 6.74983561052081e-06, "epoch": 0.8333603764400455, "percentage": 41.69, "elapsed_time": "7:39:33", "remaining_time": "10:42:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1286, "total_steps": 3080, "loss": 0.2675, "learning_rate": 6.739773741871924e-06, "epoch": 0.8346584455622262, "percentage": 41.75, "elapsed_time": "7:40:13", "remaining_time": "10:42:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1288, "total_steps": 3080, "loss": 0.2853, "learning_rate": 6.729703850834381e-06, "epoch": 0.8359565146844069, "percentage": 41.82, "elapsed_time": "7:40:54", "remaining_time": "10:41:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1290, "total_steps": 3080, "loss": 0.26, "learning_rate": 6.719625983842144e-06, "epoch": 0.8372545838065877, "percentage": 41.88, "elapsed_time": "7:41:36", "remaining_time": "10:40:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1292, "total_steps": 3080, "loss": 0.2932, "learning_rate": 6.7095401873659446e-06, "epoch": 0.8385526529287685, "percentage": 41.95, "elapsed_time": "7:42:19", "remaining_time": "10:39:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1294, "total_steps": 3080, "loss": 0.2733, "learning_rate": 6.699446507913083e-06, "epoch": 0.8398507220509492, "percentage": 42.01, "elapsed_time": "7:42:58", "remaining_time": "10:39:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1296, "total_steps": 3080, "loss": 0.2729, "learning_rate": 6.689344992027213e-06, "epoch": 0.84114879117313, "percentage": 42.08, "elapsed_time": "7:43:36", "remaining_time": "10:38:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1298, "total_steps": 3080, "loss": 0.2801, "learning_rate": 6.6792356862881144e-06, "epoch": 0.8424468602953107, "percentage": 42.14, "elapsed_time": "7:44:17", "remaining_time": "10:37:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1300, "total_steps": 3080, "loss": 0.2754, "learning_rate": 6.669118637311491e-06, "epoch": 0.8437449294174915, "percentage": 42.21, "elapsed_time": "7:44:56", "remaining_time": "10:36:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1302, "total_steps": 3080, "loss": 0.3015, "learning_rate": 6.65899389174876e-06, "epoch": 0.8450429985396722, "percentage": 42.27, "elapsed_time": "7:45:37", "remaining_time": "10:35:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1304, "total_steps": 3080, "loss": 0.2583, "learning_rate": 6.648861496286818e-06, "epoch": 0.846341067661853, "percentage": 42.34, "elapsed_time": "7:46:16", "remaining_time": "10:35:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1306, "total_steps": 3080, "loss": 0.2926, "learning_rate": 6.63872149764784e-06, "epoch": 0.8476391367840338, "percentage": 42.4, "elapsed_time": "7:46:54", "remaining_time": "10:34:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1308, "total_steps": 3080, "loss": 0.2621, "learning_rate": 6.628573942589062e-06, "epoch": 0.8489372059062145, "percentage": 42.47, "elapsed_time": "7:47:34", "remaining_time": "10:33:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1310, "total_steps": 3080, "loss": 0.2859, "learning_rate": 6.618418877902563e-06, "epoch": 0.8502352750283952, "percentage": 42.53, "elapsed_time": "7:48:15", "remaining_time": "10:32:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1312, "total_steps": 3080, "loss": 0.2694, "learning_rate": 6.608256350415052e-06, "epoch": 0.851533344150576, "percentage": 42.6, "elapsed_time": "7:48:54", "remaining_time": "10:31:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1314, "total_steps": 3080, "loss": 0.3035, "learning_rate": 6.598086406987647e-06, "epoch": 0.8528314132727568, "percentage": 42.66, "elapsed_time": "7:49:40", "remaining_time": "10:31:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1316, "total_steps": 3080, "loss": 0.2932, "learning_rate": 6.587909094515663e-06, "epoch": 0.8541294823949376, "percentage": 42.73, "elapsed_time": "7:50:19", "remaining_time": "10:30:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1318, "total_steps": 3080, "loss": 0.2692, "learning_rate": 6.577724459928396e-06, "epoch": 0.8554275515171182, "percentage": 42.79, "elapsed_time": "7:50:56", "remaining_time": "10:29:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1320, "total_steps": 3080, "loss": 0.2803, "learning_rate": 6.567532550188908e-06, "epoch": 0.856725620639299, "percentage": 42.86, "elapsed_time": "7:51:38", "remaining_time": "10:28:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1322, "total_steps": 3080, "loss": 0.2861, "learning_rate": 6.5573334122938e-06, "epoch": 0.8580236897614798, "percentage": 42.92, "elapsed_time": "7:52:15", "remaining_time": "10:28:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1324, "total_steps": 3080, "loss": 0.2783, "learning_rate": 6.547127093273009e-06, "epoch": 0.8593217588836606, "percentage": 42.99, "elapsed_time": "7:52:56", "remaining_time": "10:27:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1326, "total_steps": 3080, "loss": 0.285, "learning_rate": 6.536913640189588e-06, "epoch": 0.8606198280058414, "percentage": 43.05, "elapsed_time": "7:53:36", "remaining_time": "10:26:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1328, "total_steps": 3080, "loss": 0.2985, "learning_rate": 6.526693100139481e-06, "epoch": 0.861917897128022, "percentage": 43.12, "elapsed_time": "7:54:13", "remaining_time": "10:25:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1330, "total_steps": 3080, "loss": 0.3166, "learning_rate": 6.5164655202513135e-06, "epoch": 0.8632159662502028, "percentage": 43.18, "elapsed_time": "7:54:52", "remaining_time": "10:24:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1332, "total_steps": 3080, "loss": 0.2808, "learning_rate": 6.5062309476861714e-06, "epoch": 0.8645140353723836, "percentage": 43.25, "elapsed_time": "7:55:35", "remaining_time": "10:24:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1334, "total_steps": 3080, "loss": 0.2821, "learning_rate": 6.495989429637388e-06, "epoch": 0.8658121044945644, "percentage": 43.31, "elapsed_time": "7:56:16", "remaining_time": "10:23:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1336, "total_steps": 3080, "loss": 0.2667, "learning_rate": 6.485741013330321e-06, "epoch": 0.8671101736167451, "percentage": 43.38, "elapsed_time": "7:56:52", "remaining_time": "10:22:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1338, "total_steps": 3080, "loss": 0.2621, "learning_rate": 6.475485746022136e-06, "epoch": 0.8684082427389258, "percentage": 43.44, "elapsed_time": "7:57:32", "remaining_time": "10:21:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1340, "total_steps": 3080, "loss": 0.2907, "learning_rate": 6.465223675001593e-06, "epoch": 0.8697063118611066, "percentage": 43.51, "elapsed_time": "7:58:10", "remaining_time": "10:20:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1342, "total_steps": 3080, "loss": 0.3039, "learning_rate": 6.454954847588824e-06, "epoch": 0.8710043809832874, "percentage": 43.57, "elapsed_time": "7:58:45", "remaining_time": "10:20:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1344, "total_steps": 3080, "loss": 0.2774, "learning_rate": 6.444679311135112e-06, "epoch": 0.8723024501054681, "percentage": 43.64, "elapsed_time": "7:59:24", "remaining_time": "10:19:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1346, "total_steps": 3080, "loss": 0.3136, "learning_rate": 6.434397113022683e-06, "epoch": 0.8736005192276489, "percentage": 43.7, "elapsed_time": "8:00:09", "remaining_time": "10:18:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1348, "total_steps": 3080, "loss": 0.2827, "learning_rate": 6.424108300664479e-06, "epoch": 0.8748985883498296, "percentage": 43.77, "elapsed_time": "8:00:46", "remaining_time": "10:17:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1350, "total_steps": 3080, "loss": 0.2842, "learning_rate": 6.4138129215039356e-06, "epoch": 0.8761966574720104, "percentage": 43.83, "elapsed_time": "8:01:24", "remaining_time": "10:16:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1352, "total_steps": 3080, "loss": 0.301, "learning_rate": 6.403511023014778e-06, "epoch": 0.8774947265941911, "percentage": 43.9, "elapsed_time": "8:02:03", "remaining_time": "10:16:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1354, "total_steps": 3080, "loss": 0.3835, "learning_rate": 6.393202652700785e-06, "epoch": 0.8787927957163719, "percentage": 43.96, "elapsed_time": "8:02:47", "remaining_time": "10:15:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1356, "total_steps": 3080, "loss": 0.2821, "learning_rate": 6.382887858095585e-06, "epoch": 0.8800908648385527, "percentage": 44.03, "elapsed_time": "8:03:26", "remaining_time": "10:14:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1358, "total_steps": 3080, "loss": 0.2718, "learning_rate": 6.372566686762427e-06, "epoch": 0.8813889339607334, "percentage": 44.09, "elapsed_time": "8:04:06", "remaining_time": "10:13:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1360, "total_steps": 3080, "loss": 0.2558, "learning_rate": 6.3622391862939606e-06, "epoch": 0.8826870030829141, "percentage": 44.16, "elapsed_time": "8:04:43", "remaining_time": "10:13:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1362, "total_steps": 3080, "loss": 0.2787, "learning_rate": 6.351905404312026e-06, "epoch": 0.8839850722050949, "percentage": 44.22, "elapsed_time": "8:05:21", "remaining_time": "10:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1364, "total_steps": 3080, "loss": 0.2801, "learning_rate": 6.341565388467425e-06, "epoch": 0.8852831413272757, "percentage": 44.29, "elapsed_time": "8:06:03", "remaining_time": "10:11:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1366, "total_steps": 3080, "loss": 0.2925, "learning_rate": 6.3312191864397045e-06, "epoch": 0.8865812104494565, "percentage": 44.35, "elapsed_time": "8:06:42", "remaining_time": "10:10:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1368, "total_steps": 3080, "loss": 0.2819, "learning_rate": 6.320866845936942e-06, "epoch": 0.8878792795716371, "percentage": 44.42, "elapsed_time": "8:07:21", "remaining_time": "10:09:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1370, "total_steps": 3080, "loss": 0.2737, "learning_rate": 6.310508414695511e-06, "epoch": 0.8891773486938179, "percentage": 44.48, "elapsed_time": "8:07:57", "remaining_time": "10:09:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1372, "total_steps": 3080, "loss": 0.2751, "learning_rate": 6.300143940479881e-06, "epoch": 0.8904754178159987, "percentage": 44.55, "elapsed_time": "8:08:33", "remaining_time": "10:08:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1374, "total_steps": 3080, "loss": 0.3036, "learning_rate": 6.289773471082381e-06, "epoch": 0.8917734869381795, "percentage": 44.61, "elapsed_time": "8:09:13", "remaining_time": "10:07:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1376, "total_steps": 3080, "loss": 0.2818, "learning_rate": 6.279397054322983e-06, "epoch": 0.8930715560603603, "percentage": 44.68, "elapsed_time": "8:09:55", "remaining_time": "10:06:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1378, "total_steps": 3080, "loss": 0.2611, "learning_rate": 6.269014738049088e-06, "epoch": 0.8943696251825409, "percentage": 44.74, "elapsed_time": "8:10:39", "remaining_time": "10:06:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1380, "total_steps": 3080, "loss": 0.2707, "learning_rate": 6.2586265701352976e-06, "epoch": 0.8956676943047217, "percentage": 44.81, "elapsed_time": "8:11:21", "remaining_time": "10:05:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1382, "total_steps": 3080, "loss": 0.2909, "learning_rate": 6.248232598483196e-06, "epoch": 0.8969657634269025, "percentage": 44.87, "elapsed_time": "8:11:58", "remaining_time": "10:04:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1384, "total_steps": 3080, "loss": 0.2844, "learning_rate": 6.2378328710211345e-06, "epoch": 0.8982638325490833, "percentage": 44.94, "elapsed_time": "8:12:37", "remaining_time": "10:03:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1386, "total_steps": 3080, "loss": 0.2605, "learning_rate": 6.227427435703997e-06, "epoch": 0.899561901671264, "percentage": 45.0, "elapsed_time": "8:13:19", "remaining_time": "10:02:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1388, "total_steps": 3080, "loss": 0.2716, "learning_rate": 6.217016340512993e-06, "epoch": 0.9008599707934447, "percentage": 45.06, "elapsed_time": "8:14:00", "remaining_time": "10:02:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1390, "total_steps": 3080, "loss": 0.286, "learning_rate": 6.2065996334554325e-06, "epoch": 0.9021580399156255, "percentage": 45.13, "elapsed_time": "8:14:40", "remaining_time": "10:01:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1392, "total_steps": 3080, "loss": 0.2795, "learning_rate": 6.196177362564495e-06, "epoch": 0.9034561090378063, "percentage": 45.19, "elapsed_time": "8:15:19", "remaining_time": "10:00:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1394, "total_steps": 3080, "loss": 0.3156, "learning_rate": 6.185749575899023e-06, "epoch": 0.904754178159987, "percentage": 45.26, "elapsed_time": "8:15:57", "remaining_time": "9:59:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1396, "total_steps": 3080, "loss": 0.3009, "learning_rate": 6.175316321543291e-06, "epoch": 0.9060522472821678, "percentage": 45.32, "elapsed_time": "8:16:37", "remaining_time": "9:59:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1398, "total_steps": 3080, "loss": 0.2942, "learning_rate": 6.164877647606784e-06, "epoch": 0.9073503164043485, "percentage": 45.39, "elapsed_time": "8:17:17", "remaining_time": "9:58:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1400, "total_steps": 3080, "loss": 0.2841, "learning_rate": 6.154433602223979e-06, "epoch": 0.9086483855265293, "percentage": 45.45, "elapsed_time": "8:17:55", "remaining_time": "9:57:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1402, "total_steps": 3080, "loss": 0.27, "learning_rate": 6.143984233554125e-06, "epoch": 0.90994645464871, "percentage": 45.52, "elapsed_time": "8:18:37", "remaining_time": "9:56:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1404, "total_steps": 3080, "loss": 0.2811, "learning_rate": 6.13352958978101e-06, "epoch": 0.9112445237708908, "percentage": 45.58, "elapsed_time": "8:19:24", "remaining_time": "9:56:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1406, "total_steps": 3080, "loss": 0.3019, "learning_rate": 6.123069719112754e-06, "epoch": 0.9125425928930716, "percentage": 45.65, "elapsed_time": "8:19:59", "remaining_time": "9:55:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1408, "total_steps": 3080, "loss": 0.2985, "learning_rate": 6.112604669781572e-06, "epoch": 0.9138406620152523, "percentage": 45.71, "elapsed_time": "8:20:39", "remaining_time": "9:54:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1410, "total_steps": 3080, "loss": 0.2675, "learning_rate": 6.102134490043566e-06, "epoch": 0.915138731137433, "percentage": 45.78, "elapsed_time": "8:21:23", "remaining_time": "9:53:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1412, "total_steps": 3080, "loss": 0.2914, "learning_rate": 6.091659228178492e-06, "epoch": 0.9164368002596138, "percentage": 45.84, "elapsed_time": "8:22:05", "remaining_time": "9:53:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1414, "total_steps": 3080, "loss": 0.2768, "learning_rate": 6.0811789324895365e-06, "epoch": 0.9177348693817946, "percentage": 45.91, "elapsed_time": "8:22:49", "remaining_time": "9:52:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1416, "total_steps": 3080, "loss": 0.2829, "learning_rate": 6.070693651303105e-06, "epoch": 0.9190329385039754, "percentage": 45.97, "elapsed_time": "8:23:25", "remaining_time": "9:51:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1418, "total_steps": 3080, "loss": 0.2554, "learning_rate": 6.060203432968587e-06, "epoch": 0.920331007626156, "percentage": 46.04, "elapsed_time": "8:24:04", "remaining_time": "9:50:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1420, "total_steps": 3080, "loss": 0.284, "learning_rate": 6.049708325858139e-06, "epoch": 0.9216290767483368, "percentage": 46.1, "elapsed_time": "8:24:44", "remaining_time": "9:50:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1422, "total_steps": 3080, "loss": 0.2746, "learning_rate": 6.039208378366462e-06, "epoch": 0.9229271458705176, "percentage": 46.17, "elapsed_time": "8:25:24", "remaining_time": "9:49:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1424, "total_steps": 3080, "loss": 0.2752, "learning_rate": 6.028703638910574e-06, "epoch": 0.9242252149926984, "percentage": 46.23, "elapsed_time": "8:26:06", "remaining_time": "9:48:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1426, "total_steps": 3080, "loss": 0.2595, "learning_rate": 6.018194155929594e-06, "epoch": 0.9255232841148792, "percentage": 46.3, "elapsed_time": "8:26:44", "remaining_time": "9:47:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1428, "total_steps": 3080, "loss": 0.3008, "learning_rate": 6.0076799778845105e-06, "epoch": 0.9268213532370598, "percentage": 46.36, "elapsed_time": "8:27:23", "remaining_time": "9:46:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1430, "total_steps": 3080, "loss": 0.2936, "learning_rate": 5.997161153257963e-06, "epoch": 0.9281194223592406, "percentage": 46.43, "elapsed_time": "8:28:00", "remaining_time": "9:46:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1432, "total_steps": 3080, "loss": 0.2648, "learning_rate": 5.986637730554014e-06, "epoch": 0.9294174914814214, "percentage": 46.49, "elapsed_time": "8:28:44", "remaining_time": "9:45:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1434, "total_steps": 3080, "loss": 0.3054, "learning_rate": 5.976109758297934e-06, "epoch": 0.9307155606036022, "percentage": 46.56, "elapsed_time": "8:29:23", "remaining_time": "9:44:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1436, "total_steps": 3080, "loss": 0.2907, "learning_rate": 5.96557728503597e-06, "epoch": 0.9320136297257829, "percentage": 46.62, "elapsed_time": "8:30:09", "remaining_time": "9:44:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1438, "total_steps": 3080, "loss": 0.269, "learning_rate": 5.955040359335123e-06, "epoch": 0.9333116988479636, "percentage": 46.69, "elapsed_time": "8:30:47", "remaining_time": "9:43:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1440, "total_steps": 3080, "loss": 0.2837, "learning_rate": 5.944499029782924e-06, "epoch": 0.9346097679701444, "percentage": 46.75, "elapsed_time": "8:31:26", "remaining_time": "9:42:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1442, "total_steps": 3080, "loss": 0.2616, "learning_rate": 5.933953344987215e-06, "epoch": 0.9359078370923252, "percentage": 46.82, "elapsed_time": "8:32:07", "remaining_time": "9:41:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1444, "total_steps": 3080, "loss": 0.2896, "learning_rate": 5.923403353575916e-06, "epoch": 0.937205906214506, "percentage": 46.88, "elapsed_time": "8:32:46", "remaining_time": "9:40:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1446, "total_steps": 3080, "loss": 0.2879, "learning_rate": 5.91284910419681e-06, "epoch": 0.9385039753366867, "percentage": 46.95, "elapsed_time": "8:33:25", "remaining_time": "9:40:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1448, "total_steps": 3080, "loss": 0.3009, "learning_rate": 5.902290645517308e-06, "epoch": 0.9398020444588674, "percentage": 47.01, "elapsed_time": "8:34:05", "remaining_time": "9:39:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1450, "total_steps": 3080, "loss": 0.2906, "learning_rate": 5.891728026224238e-06, "epoch": 0.9411001135810482, "percentage": 47.08, "elapsed_time": "8:34:49", "remaining_time": "9:38:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1452, "total_steps": 3080, "loss": 0.2719, "learning_rate": 5.88116129502361e-06, "epoch": 0.942398182703229, "percentage": 47.14, "elapsed_time": "8:35:30", "remaining_time": "9:37:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1454, "total_steps": 3080, "loss": 0.2845, "learning_rate": 5.870590500640392e-06, "epoch": 0.9436962518254097, "percentage": 47.21, "elapsed_time": "8:36:11", "remaining_time": "9:37:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1456, "total_steps": 3080, "loss": 0.2668, "learning_rate": 5.860015691818292e-06, "epoch": 0.9449943209475905, "percentage": 47.27, "elapsed_time": "8:36:51", "remaining_time": "9:36:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1458, "total_steps": 3080, "loss": 0.2694, "learning_rate": 5.84943691731953e-06, "epoch": 0.9462923900697712, "percentage": 47.34, "elapsed_time": "8:37:27", "remaining_time": "9:35:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1460, "total_steps": 3080, "loss": 0.2901, "learning_rate": 5.838854225924607e-06, "epoch": 0.947590459191952, "percentage": 47.4, "elapsed_time": "8:38:09", "remaining_time": "9:34:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1462, "total_steps": 3080, "loss": 0.2852, "learning_rate": 5.82826766643209e-06, "epoch": 0.9488885283141327, "percentage": 47.47, "elapsed_time": "8:38:50", "remaining_time": "9:34:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1464, "total_steps": 3080, "loss": 0.3003, "learning_rate": 5.817677287658382e-06, "epoch": 0.9501865974363135, "percentage": 47.53, "elapsed_time": "8:39:33", "remaining_time": "9:33:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1466, "total_steps": 3080, "loss": 0.2643, "learning_rate": 5.807083138437497e-06, "epoch": 0.9514846665584943, "percentage": 47.6, "elapsed_time": "8:40:06", "remaining_time": "9:32:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1468, "total_steps": 3080, "loss": 0.2951, "learning_rate": 5.796485267620834e-06, "epoch": 0.952782735680675, "percentage": 47.66, "elapsed_time": "8:40:45", "remaining_time": "9:31:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1470, "total_steps": 3080, "loss": 0.2741, "learning_rate": 5.78588372407695e-06, "epoch": 0.9540808048028557, "percentage": 47.73, "elapsed_time": "8:41:26", "remaining_time": "9:31:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1472, "total_steps": 3080, "loss": 0.291, "learning_rate": 5.7752785566913484e-06, "epoch": 0.9553788739250365, "percentage": 47.79, "elapsed_time": "8:42:07", "remaining_time": "9:30:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1474, "total_steps": 3080, "loss": 0.3024, "learning_rate": 5.764669814366231e-06, "epoch": 0.9566769430472173, "percentage": 47.86, "elapsed_time": "8:42:49", "remaining_time": "9:29:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1476, "total_steps": 3080, "loss": 0.3108, "learning_rate": 5.754057546020289e-06, "epoch": 0.9579750121693981, "percentage": 47.92, "elapsed_time": "8:43:29", "remaining_time": "9:28:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1478, "total_steps": 3080, "loss": 0.2684, "learning_rate": 5.743441800588472e-06, "epoch": 0.9592730812915787, "percentage": 47.99, "elapsed_time": "8:44:09", "remaining_time": "9:28:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1480, "total_steps": 3080, "loss": 0.2902, "learning_rate": 5.732822627021765e-06, "epoch": 0.9605711504137595, "percentage": 48.05, "elapsed_time": "8:44:49", "remaining_time": "9:27:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1482, "total_steps": 3080, "loss": 0.2946, "learning_rate": 5.722200074286959e-06, "epoch": 0.9618692195359403, "percentage": 48.12, "elapsed_time": "8:45:32", "remaining_time": "9:26:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1484, "total_steps": 3080, "loss": 0.3033, "learning_rate": 5.711574191366427e-06, "epoch": 0.9631672886581211, "percentage": 48.18, "elapsed_time": "8:46:11", "remaining_time": "9:25:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1486, "total_steps": 3080, "loss": 0.2756, "learning_rate": 5.700945027257896e-06, "epoch": 0.9644653577803018, "percentage": 48.25, "elapsed_time": "8:46:55", "remaining_time": "9:25:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1488, "total_steps": 3080, "loss": 0.2784, "learning_rate": 5.690312630974229e-06, "epoch": 0.9657634269024825, "percentage": 48.31, "elapsed_time": "8:47:35", "remaining_time": "9:24:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1490, "total_steps": 3080, "loss": 0.2736, "learning_rate": 5.6796770515431886e-06, "epoch": 0.9670614960246633, "percentage": 48.38, "elapsed_time": "8:48:13", "remaining_time": "9:23:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1492, "total_steps": 3080, "loss": 0.2638, "learning_rate": 5.6690383380072136e-06, "epoch": 0.9683595651468441, "percentage": 48.44, "elapsed_time": "8:48:54", "remaining_time": "9:22:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1494, "total_steps": 3080, "loss": 0.2518, "learning_rate": 5.658396539423197e-06, "epoch": 0.9696576342690248, "percentage": 48.51, "elapsed_time": "8:49:35", "remaining_time": "9:22:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1496, "total_steps": 3080, "loss": 0.2709, "learning_rate": 5.647751704862263e-06, "epoch": 0.9709557033912056, "percentage": 48.57, "elapsed_time": "8:50:16", "remaining_time": "9:21:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1498, "total_steps": 3080, "loss": 0.2967, "learning_rate": 5.637103883409525e-06, "epoch": 0.9722537725133863, "percentage": 48.64, "elapsed_time": "8:50:58", "remaining_time": "9:20:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1500, "total_steps": 3080, "loss": 0.264, "learning_rate": 5.626453124163876e-06, "epoch": 0.9735518416355671, "percentage": 48.7, "elapsed_time": "8:51:40", "remaining_time": "9:20:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1500, "total_steps": 3080, "eval_loss": 0.28451454639434814, "epoch": 0.9735518416355671, "percentage": 48.7, "elapsed_time": "9:05:28", "remaining_time": "9:34:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1502, "total_steps": 3080, "loss": 0.2663, "learning_rate": 5.615799476237752e-06, "epoch": 0.9748499107577479, "percentage": 48.77, "elapsed_time": "9:06:11", "remaining_time": "9:33:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1504, "total_steps": 3080, "loss": 0.2636, "learning_rate": 5.605142988756917e-06, "epoch": 0.9761479798799286, "percentage": 48.83, "elapsed_time": "9:06:58", "remaining_time": "9:33:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1506, "total_steps": 3080, "loss": 0.2724, "learning_rate": 5.594483710860217e-06, "epoch": 0.9774460490021094, "percentage": 48.9, "elapsed_time": "9:07:38", "remaining_time": "9:32:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1508, "total_steps": 3080, "loss": 0.3434, "learning_rate": 5.583821691699373e-06, "epoch": 0.9787441181242901, "percentage": 48.96, "elapsed_time": "9:08:24", "remaining_time": "9:31:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1510, "total_steps": 3080, "loss": 0.3, "learning_rate": 5.573156980438743e-06, "epoch": 0.9800421872464709, "percentage": 49.03, "elapsed_time": "9:09:00", "remaining_time": "9:30:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1512, "total_steps": 3080, "loss": 0.3051, "learning_rate": 5.562489626255104e-06, "epoch": 0.9813402563686516, "percentage": 49.09, "elapsed_time": "9:09:41", "remaining_time": "9:30:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1514, "total_steps": 3080, "loss": 0.2824, "learning_rate": 5.5518196783374126e-06, "epoch": 0.9826383254908324, "percentage": 49.16, "elapsed_time": "9:10:23", "remaining_time": "9:29:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1516, "total_steps": 3080, "loss": 0.2885, "learning_rate": 5.541147185886591e-06, "epoch": 0.9839363946130132, "percentage": 49.22, "elapsed_time": "9:11:05", "remaining_time": "9:28:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1518, "total_steps": 3080, "loss": 0.2942, "learning_rate": 5.530472198115291e-06, "epoch": 0.9852344637351939, "percentage": 49.29, "elapsed_time": "9:11:44", "remaining_time": "9:27:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1520, "total_steps": 3080, "loss": 0.2877, "learning_rate": 5.519794764247673e-06, "epoch": 0.9865325328573746, "percentage": 49.35, "elapsed_time": "9:12:23", "remaining_time": "9:26:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1522, "total_steps": 3080, "loss": 0.2686, "learning_rate": 5.509114933519179e-06, "epoch": 0.9878306019795554, "percentage": 49.42, "elapsed_time": "9:13:06", "remaining_time": "9:26:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1524, "total_steps": 3080, "loss": 0.2845, "learning_rate": 5.498432755176295e-06, "epoch": 0.9891286711017362, "percentage": 49.48, "elapsed_time": "9:13:49", "remaining_time": "9:25:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1526, "total_steps": 3080, "loss": 0.3064, "learning_rate": 5.487748278476342e-06, "epoch": 0.990426740223917, "percentage": 49.55, "elapsed_time": "9:14:30", "remaining_time": "9:24:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1528, "total_steps": 3080, "loss": 0.2706, "learning_rate": 5.477061552687234e-06, "epoch": 0.9917248093460976, "percentage": 49.61, "elapsed_time": "9:15:06", "remaining_time": "9:23:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1530, "total_steps": 3080, "loss": 0.3087, "learning_rate": 5.466372627087256e-06, "epoch": 0.9930228784682784, "percentage": 49.68, "elapsed_time": "9:15:46", "remaining_time": "9:23:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1532, "total_steps": 3080, "loss": 0.2611, "learning_rate": 5.455681550964839e-06, "epoch": 0.9943209475904592, "percentage": 49.74, "elapsed_time": "9:16:26", "remaining_time": "9:22:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1534, "total_steps": 3080, "loss": 0.27, "learning_rate": 5.4449883736183286e-06, "epoch": 0.99561901671264, "percentage": 49.81, "elapsed_time": "9:17:02", "remaining_time": "9:21:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1536, "total_steps": 3080, "loss": 0.2574, "learning_rate": 5.4342931443557576e-06, "epoch": 0.9969170858348207, "percentage": 49.87, "elapsed_time": "9:17:40", "remaining_time": "9:20:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1538, "total_steps": 3080, "loss": 0.2659, "learning_rate": 5.423595912494626e-06, "epoch": 0.9982151549570014, "percentage": 49.94, "elapsed_time": "9:18:18", "remaining_time": "9:19:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1540, "total_steps": 3080, "loss": 0.2702, "learning_rate": 5.412896727361663e-06, "epoch": 0.9995132240791822, "percentage": 50.0, "elapsed_time": "9:18:59", "remaining_time": "9:18:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1542, "total_steps": 3080, "loss": 0.2835, "learning_rate": 5.402195638292605e-06, "epoch": 1.0008112932013629, "percentage": 50.06, "elapsed_time": "9:19:39", "remaining_time": "9:18:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1544, "total_steps": 3080, "loss": 0.3112, "learning_rate": 5.391492694631975e-06, "epoch": 1.0021093623235438, "percentage": 50.13, "elapsed_time": "9:20:21", "remaining_time": "9:17:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1546, "total_steps": 3080, "loss": 0.2822, "learning_rate": 5.380787945732835e-06, "epoch": 1.0034074314457244, "percentage": 50.19, "elapsed_time": "9:20:58", "remaining_time": "9:16:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1548, "total_steps": 3080, "loss": 0.2594, "learning_rate": 5.370081440956582e-06, "epoch": 1.0047055005679053, "percentage": 50.26, "elapsed_time": "9:21:38", "remaining_time": "9:15:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1550, "total_steps": 3080, "loss": 0.2768, "learning_rate": 5.359373229672708e-06, "epoch": 1.006003569690086, "percentage": 50.32, "elapsed_time": "9:22:17", "remaining_time": "9:15:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1552, "total_steps": 3080, "loss": 0.281, "learning_rate": 5.348663361258568e-06, "epoch": 1.0073016388122666, "percentage": 50.39, "elapsed_time": "9:23:01", "remaining_time": "9:14:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1554, "total_steps": 3080, "loss": 0.2736, "learning_rate": 5.337951885099167e-06, "epoch": 1.0085997079344475, "percentage": 50.45, "elapsed_time": "9:23:40", "remaining_time": "9:13:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1556, "total_steps": 3080, "loss": 0.3052, "learning_rate": 5.327238850586912e-06, "epoch": 1.0098977770566282, "percentage": 50.52, "elapsed_time": "9:24:20", "remaining_time": "9:12:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1558, "total_steps": 3080, "loss": 0.2661, "learning_rate": 5.316524307121409e-06, "epoch": 1.011195846178809, "percentage": 50.58, "elapsed_time": "9:25:05", "remaining_time": "9:12:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1560, "total_steps": 3080, "loss": 0.2632, "learning_rate": 5.3058083041092145e-06, "epoch": 1.0124939153009898, "percentage": 50.65, "elapsed_time": "9:25:43", "remaining_time": "9:11:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1562, "total_steps": 3080, "loss": 0.283, "learning_rate": 5.2950908909636144e-06, "epoch": 1.0137919844231704, "percentage": 50.71, "elapsed_time": "9:26:21", "remaining_time": "9:10:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1564, "total_steps": 3080, "loss": 0.2647, "learning_rate": 5.2843721171044e-06, "epoch": 1.0150900535453513, "percentage": 50.78, "elapsed_time": "9:27:04", "remaining_time": "9:09:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1566, "total_steps": 3080, "loss": 0.2662, "learning_rate": 5.273652031957639e-06, "epoch": 1.016388122667532, "percentage": 50.84, "elapsed_time": "9:27:47", "remaining_time": "9:08:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1568, "total_steps": 3080, "loss": 0.2577, "learning_rate": 5.262930684955439e-06, "epoch": 1.0176861917897129, "percentage": 50.91, "elapsed_time": "9:28:27", "remaining_time": "9:08:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1570, "total_steps": 3080, "loss": 0.2704, "learning_rate": 5.252208125535731e-06, "epoch": 1.0189842609118935, "percentage": 50.97, "elapsed_time": "9:29:05", "remaining_time": "9:07:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1572, "total_steps": 3080, "loss": 0.2933, "learning_rate": 5.241484403142036e-06, "epoch": 1.0202823300340742, "percentage": 51.04, "elapsed_time": "9:29:44", "remaining_time": "9:06:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1574, "total_steps": 3080, "loss": 0.2657, "learning_rate": 5.2307595672232384e-06, "epoch": 1.021580399156255, "percentage": 51.1, "elapsed_time": "9:30:24", "remaining_time": "9:05:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1576, "total_steps": 3080, "loss": 0.2699, "learning_rate": 5.220033667233356e-06, "epoch": 1.0228784682784358, "percentage": 51.17, "elapsed_time": "9:31:08", "remaining_time": "9:05:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1578, "total_steps": 3080, "loss": 0.3055, "learning_rate": 5.209306752631312e-06, "epoch": 1.0241765374006166, "percentage": 51.23, "elapsed_time": "9:31:47", "remaining_time": "9:04:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1580, "total_steps": 3080, "loss": 0.2869, "learning_rate": 5.198578872880709e-06, "epoch": 1.0254746065227973, "percentage": 51.3, "elapsed_time": "9:32:28", "remaining_time": "9:03:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1582, "total_steps": 3080, "loss": 0.302, "learning_rate": 5.187850077449604e-06, "epoch": 1.026772675644978, "percentage": 51.36, "elapsed_time": "9:33:07", "remaining_time": "9:02:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1584, "total_steps": 3080, "loss": 0.3198, "learning_rate": 5.177120415810271e-06, "epoch": 1.0280707447671589, "percentage": 51.43, "elapsed_time": "9:33:49", "remaining_time": "9:01:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1586, "total_steps": 3080, "loss": 0.2843, "learning_rate": 5.1663899374389795e-06, "epoch": 1.0293688138893395, "percentage": 51.49, "elapsed_time": "9:34:30", "remaining_time": "9:01:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1588, "total_steps": 3080, "loss": 0.2572, "learning_rate": 5.155658691815766e-06, "epoch": 1.0306668830115204, "percentage": 51.56, "elapsed_time": "9:35:10", "remaining_time": "9:00:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1590, "total_steps": 3080, "loss": 0.2561, "learning_rate": 5.144926728424205e-06, "epoch": 1.031964952133701, "percentage": 51.62, "elapsed_time": "9:35:52", "remaining_time": "8:59:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1592, "total_steps": 3080, "loss": 0.2466, "learning_rate": 5.134194096751182e-06, "epoch": 1.0332630212558818, "percentage": 51.69, "elapsed_time": "9:36:34", "remaining_time": "8:58:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1594, "total_steps": 3080, "loss": 0.2787, "learning_rate": 5.123460846286661e-06, "epoch": 1.0345610903780627, "percentage": 51.75, "elapsed_time": "9:37:13", "remaining_time": "8:58:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1596, "total_steps": 3080, "loss": 0.3149, "learning_rate": 5.112727026523461e-06, "epoch": 1.0358591595002433, "percentage": 51.82, "elapsed_time": "9:37:54", "remaining_time": "8:57:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1598, "total_steps": 3080, "loss": 0.2801, "learning_rate": 5.101992686957028e-06, "epoch": 1.0371572286224242, "percentage": 51.88, "elapsed_time": "9:38:40", "remaining_time": "8:56:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1600, "total_steps": 3080, "loss": 0.2836, "learning_rate": 5.091257877085201e-06, "epoch": 1.0384552977446049, "percentage": 51.95, "elapsed_time": "9:39:17", "remaining_time": "8:55:50", "throughput": "0.00", "total_tokens": 0}