sedrickkeh's picture
Training in progress, epoch 2
118e260 verified
{"current_steps": 10, "total_steps": 2724, "loss": 0.7008, "learning_rate": 5e-06, "epoch": 0.01100715465052284, "percentage": 0.37, "elapsed_time": "0:01:31", "remaining_time": "6:55:39"}
{"current_steps": 20, "total_steps": 2724, "loss": 0.6366, "learning_rate": 5e-06, "epoch": 0.02201430930104568, "percentage": 0.73, "elapsed_time": "0:02:54", "remaining_time": "6:34:13"}
{"current_steps": 30, "total_steps": 2724, "loss": 0.6043, "learning_rate": 5e-06, "epoch": 0.03302146395156852, "percentage": 1.1, "elapsed_time": "0:04:18", "remaining_time": "6:26:29"}
{"current_steps": 40, "total_steps": 2724, "loss": 0.5955, "learning_rate": 5e-06, "epoch": 0.04402861860209136, "percentage": 1.47, "elapsed_time": "0:05:42", "remaining_time": "6:22:45"}
{"current_steps": 50, "total_steps": 2724, "loss": 0.5702, "learning_rate": 5e-06, "epoch": 0.0550357732526142, "percentage": 1.84, "elapsed_time": "0:07:06", "remaining_time": "6:20:15"}
{"current_steps": 60, "total_steps": 2724, "loss": 0.5644, "learning_rate": 5e-06, "epoch": 0.06604292790313704, "percentage": 2.2, "elapsed_time": "0:08:30", "remaining_time": "6:18:00"}
{"current_steps": 70, "total_steps": 2724, "loss": 0.5613, "learning_rate": 5e-06, "epoch": 0.07705008255365987, "percentage": 2.57, "elapsed_time": "0:09:55", "remaining_time": "6:16:01"}
{"current_steps": 80, "total_steps": 2724, "loss": 0.5517, "learning_rate": 5e-06, "epoch": 0.08805723720418272, "percentage": 2.94, "elapsed_time": "0:11:19", "remaining_time": "6:14:09"}
{"current_steps": 90, "total_steps": 2724, "loss": 0.549, "learning_rate": 5e-06, "epoch": 0.09906439185470556, "percentage": 3.3, "elapsed_time": "0:12:43", "remaining_time": "6:12:22"}
{"current_steps": 100, "total_steps": 2724, "loss": 0.5514, "learning_rate": 5e-06, "epoch": 0.1100715465052284, "percentage": 3.67, "elapsed_time": "0:14:06", "remaining_time": "6:10:18"}
{"current_steps": 110, "total_steps": 2724, "loss": 0.5413, "learning_rate": 5e-06, "epoch": 0.12107870115575124, "percentage": 4.04, "elapsed_time": "0:15:30", "remaining_time": "6:08:23"}
{"current_steps": 120, "total_steps": 2724, "loss": 0.5458, "learning_rate": 5e-06, "epoch": 0.13208585580627408, "percentage": 4.41, "elapsed_time": "0:16:53", "remaining_time": "6:06:37"}
{"current_steps": 130, "total_steps": 2724, "loss": 0.5475, "learning_rate": 5e-06, "epoch": 0.14309301045679693, "percentage": 4.77, "elapsed_time": "0:18:17", "remaining_time": "6:04:54"}
{"current_steps": 140, "total_steps": 2724, "loss": 0.5359, "learning_rate": 5e-06, "epoch": 0.15410016510731975, "percentage": 5.14, "elapsed_time": "0:19:40", "remaining_time": "6:03:12"}
{"current_steps": 150, "total_steps": 2724, "loss": 0.5404, "learning_rate": 5e-06, "epoch": 0.1651073197578426, "percentage": 5.51, "elapsed_time": "0:21:03", "remaining_time": "6:01:29"}
{"current_steps": 160, "total_steps": 2724, "loss": 0.5384, "learning_rate": 5e-06, "epoch": 0.17611447440836545, "percentage": 5.87, "elapsed_time": "0:22:27", "remaining_time": "5:59:51"}
{"current_steps": 170, "total_steps": 2724, "loss": 0.5378, "learning_rate": 5e-06, "epoch": 0.18712162905888827, "percentage": 6.24, "elapsed_time": "0:23:50", "remaining_time": "5:58:09"}
{"current_steps": 180, "total_steps": 2724, "loss": 0.53, "learning_rate": 5e-06, "epoch": 0.19812878370941112, "percentage": 6.61, "elapsed_time": "0:25:13", "remaining_time": "5:56:36"}
{"current_steps": 190, "total_steps": 2724, "loss": 0.5296, "learning_rate": 5e-06, "epoch": 0.20913593835993396, "percentage": 6.98, "elapsed_time": "0:26:37", "remaining_time": "5:55:05"}
{"current_steps": 200, "total_steps": 2724, "loss": 0.538, "learning_rate": 5e-06, "epoch": 0.2201430930104568, "percentage": 7.34, "elapsed_time": "0:28:00", "remaining_time": "5:53:32"}
{"current_steps": 210, "total_steps": 2724, "loss": 0.5249, "learning_rate": 5e-06, "epoch": 0.23115024766097964, "percentage": 7.71, "elapsed_time": "0:29:24", "remaining_time": "5:52:01"}
{"current_steps": 220, "total_steps": 2724, "loss": 0.5243, "learning_rate": 5e-06, "epoch": 0.24215740231150248, "percentage": 8.08, "elapsed_time": "0:30:47", "remaining_time": "5:50:32"}
{"current_steps": 230, "total_steps": 2724, "loss": 0.5213, "learning_rate": 5e-06, "epoch": 0.25316455696202533, "percentage": 8.44, "elapsed_time": "0:32:11", "remaining_time": "5:48:59"}
{"current_steps": 240, "total_steps": 2724, "loss": 0.5241, "learning_rate": 5e-06, "epoch": 0.26417171161254815, "percentage": 8.81, "elapsed_time": "0:33:34", "remaining_time": "5:47:31"}
{"current_steps": 250, "total_steps": 2724, "loss": 0.5214, "learning_rate": 5e-06, "epoch": 0.275178866263071, "percentage": 9.18, "elapsed_time": "0:34:58", "remaining_time": "5:46:09"}
{"current_steps": 260, "total_steps": 2724, "loss": 0.5227, "learning_rate": 5e-06, "epoch": 0.28618602091359385, "percentage": 9.54, "elapsed_time": "0:36:22", "remaining_time": "5:44:41"}
{"current_steps": 270, "total_steps": 2724, "loss": 0.5215, "learning_rate": 5e-06, "epoch": 0.2971931755641167, "percentage": 9.91, "elapsed_time": "0:37:45", "remaining_time": "5:43:11"}
{"current_steps": 280, "total_steps": 2724, "loss": 0.5204, "learning_rate": 5e-06, "epoch": 0.3082003302146395, "percentage": 10.28, "elapsed_time": "0:39:09", "remaining_time": "5:41:47"}
{"current_steps": 290, "total_steps": 2724, "loss": 0.5191, "learning_rate": 5e-06, "epoch": 0.31920748486516237, "percentage": 10.65, "elapsed_time": "0:40:33", "remaining_time": "5:40:24"}
{"current_steps": 300, "total_steps": 2724, "loss": 0.5218, "learning_rate": 5e-06, "epoch": 0.3302146395156852, "percentage": 11.01, "elapsed_time": "0:41:57", "remaining_time": "5:39:01"}
{"current_steps": 310, "total_steps": 2724, "loss": 0.519, "learning_rate": 5e-06, "epoch": 0.341221794166208, "percentage": 11.38, "elapsed_time": "0:43:20", "remaining_time": "5:37:30"}
{"current_steps": 320, "total_steps": 2724, "loss": 0.5123, "learning_rate": 5e-06, "epoch": 0.3522289488167309, "percentage": 11.75, "elapsed_time": "0:44:43", "remaining_time": "5:36:03"}
{"current_steps": 330, "total_steps": 2724, "loss": 0.5173, "learning_rate": 5e-06, "epoch": 0.3632361034672537, "percentage": 12.11, "elapsed_time": "0:46:08", "remaining_time": "5:34:41"}
{"current_steps": 340, "total_steps": 2724, "loss": 0.5118, "learning_rate": 5e-06, "epoch": 0.37424325811777653, "percentage": 12.48, "elapsed_time": "0:47:32", "remaining_time": "5:33:20"}
{"current_steps": 350, "total_steps": 2724, "loss": 0.5098, "learning_rate": 5e-06, "epoch": 0.3852504127682994, "percentage": 12.85, "elapsed_time": "0:48:56", "remaining_time": "5:31:57"}
{"current_steps": 360, "total_steps": 2724, "loss": 0.5094, "learning_rate": 5e-06, "epoch": 0.39625756741882223, "percentage": 13.22, "elapsed_time": "0:50:20", "remaining_time": "5:30:36"}
{"current_steps": 370, "total_steps": 2724, "loss": 0.5123, "learning_rate": 5e-06, "epoch": 0.40726472206934505, "percentage": 13.58, "elapsed_time": "0:51:45", "remaining_time": "5:29:15"}
{"current_steps": 380, "total_steps": 2724, "loss": 0.5118, "learning_rate": 5e-06, "epoch": 0.41827187671986793, "percentage": 13.95, "elapsed_time": "0:53:09", "remaining_time": "5:27:54"}
{"current_steps": 390, "total_steps": 2724, "loss": 0.5103, "learning_rate": 5e-06, "epoch": 0.42927903137039075, "percentage": 14.32, "elapsed_time": "0:54:33", "remaining_time": "5:26:31"}
{"current_steps": 400, "total_steps": 2724, "loss": 0.5057, "learning_rate": 5e-06, "epoch": 0.4402861860209136, "percentage": 14.68, "elapsed_time": "0:55:58", "remaining_time": "5:25:10"}
{"current_steps": 410, "total_steps": 2724, "loss": 0.5105, "learning_rate": 5e-06, "epoch": 0.45129334067143645, "percentage": 15.05, "elapsed_time": "0:57:22", "remaining_time": "5:23:48"}
{"current_steps": 420, "total_steps": 2724, "loss": 0.5057, "learning_rate": 5e-06, "epoch": 0.46230049532195927, "percentage": 15.42, "elapsed_time": "0:58:46", "remaining_time": "5:22:27"}
{"current_steps": 430, "total_steps": 2724, "loss": 0.5076, "learning_rate": 5e-06, "epoch": 0.4733076499724821, "percentage": 15.79, "elapsed_time": "1:00:10", "remaining_time": "5:21:03"}
{"current_steps": 440, "total_steps": 2724, "loss": 0.5091, "learning_rate": 5e-06, "epoch": 0.48431480462300497, "percentage": 16.15, "elapsed_time": "1:01:35", "remaining_time": "5:19:42"}
{"current_steps": 450, "total_steps": 2724, "loss": 0.5042, "learning_rate": 5e-06, "epoch": 0.4953219592735278, "percentage": 16.52, "elapsed_time": "1:02:59", "remaining_time": "5:18:18"}
{"current_steps": 460, "total_steps": 2724, "loss": 0.5021, "learning_rate": 5e-06, "epoch": 0.5063291139240507, "percentage": 16.89, "elapsed_time": "1:04:23", "remaining_time": "5:16:53"}
{"current_steps": 470, "total_steps": 2724, "loss": 0.5031, "learning_rate": 5e-06, "epoch": 0.5173362685745735, "percentage": 17.25, "elapsed_time": "1:05:46", "remaining_time": "5:15:26"}
{"current_steps": 480, "total_steps": 2724, "loss": 0.496, "learning_rate": 5e-06, "epoch": 0.5283434232250963, "percentage": 17.62, "elapsed_time": "1:07:10", "remaining_time": "5:14:01"}
{"current_steps": 490, "total_steps": 2724, "loss": 0.5084, "learning_rate": 5e-06, "epoch": 0.5393505778756191, "percentage": 17.99, "elapsed_time": "1:08:33", "remaining_time": "5:12:35"}
{"current_steps": 500, "total_steps": 2724, "loss": 0.5058, "learning_rate": 5e-06, "epoch": 0.550357732526142, "percentage": 18.36, "elapsed_time": "1:09:57", "remaining_time": "5:11:12"}
{"current_steps": 510, "total_steps": 2724, "loss": 0.5042, "learning_rate": 5e-06, "epoch": 0.5613648871766649, "percentage": 18.72, "elapsed_time": "1:11:22", "remaining_time": "5:09:49"}
{"current_steps": 520, "total_steps": 2724, "loss": 0.4981, "learning_rate": 5e-06, "epoch": 0.5723720418271877, "percentage": 19.09, "elapsed_time": "1:12:46", "remaining_time": "5:08:25"}
{"current_steps": 530, "total_steps": 2724, "loss": 0.5, "learning_rate": 5e-06, "epoch": 0.5833791964777105, "percentage": 19.46, "elapsed_time": "1:14:10", "remaining_time": "5:07:03"}
{"current_steps": 540, "total_steps": 2724, "loss": 0.5058, "learning_rate": 5e-06, "epoch": 0.5943863511282333, "percentage": 19.82, "elapsed_time": "1:15:34", "remaining_time": "5:05:40"}
{"current_steps": 550, "total_steps": 2724, "loss": 0.499, "learning_rate": 5e-06, "epoch": 0.6053935057787562, "percentage": 20.19, "elapsed_time": "1:16:58", "remaining_time": "5:04:16"}
{"current_steps": 560, "total_steps": 2724, "loss": 0.5012, "learning_rate": 5e-06, "epoch": 0.616400660429279, "percentage": 20.56, "elapsed_time": "1:18:22", "remaining_time": "5:02:50"}
{"current_steps": 570, "total_steps": 2724, "loss": 0.4965, "learning_rate": 5e-06, "epoch": 0.6274078150798019, "percentage": 20.93, "elapsed_time": "1:19:45", "remaining_time": "5:01:25"}
{"current_steps": 580, "total_steps": 2724, "loss": 0.5002, "learning_rate": 5e-06, "epoch": 0.6384149697303247, "percentage": 21.29, "elapsed_time": "1:21:09", "remaining_time": "5:00:00"}
{"current_steps": 590, "total_steps": 2724, "loss": 0.5042, "learning_rate": 5e-06, "epoch": 0.6494221243808476, "percentage": 21.66, "elapsed_time": "1:22:33", "remaining_time": "4:58:34"}
{"current_steps": 600, "total_steps": 2724, "loss": 0.5, "learning_rate": 5e-06, "epoch": 0.6604292790313704, "percentage": 22.03, "elapsed_time": "1:23:56", "remaining_time": "4:57:09"}
{"current_steps": 610, "total_steps": 2724, "loss": 0.4956, "learning_rate": 5e-06, "epoch": 0.6714364336818932, "percentage": 22.39, "elapsed_time": "1:25:20", "remaining_time": "4:55:44"}
{"current_steps": 620, "total_steps": 2724, "loss": 0.4923, "learning_rate": 5e-06, "epoch": 0.682443588332416, "percentage": 22.76, "elapsed_time": "1:26:44", "remaining_time": "4:54:21"}
{"current_steps": 630, "total_steps": 2724, "loss": 0.4956, "learning_rate": 5e-06, "epoch": 0.693450742982939, "percentage": 23.13, "elapsed_time": "1:28:08", "remaining_time": "4:52:58"}
{"current_steps": 640, "total_steps": 2724, "loss": 0.4892, "learning_rate": 5e-06, "epoch": 0.7044578976334618, "percentage": 23.49, "elapsed_time": "1:29:32", "remaining_time": "4:51:35"}
{"current_steps": 650, "total_steps": 2724, "loss": 0.5006, "learning_rate": 5e-06, "epoch": 0.7154650522839846, "percentage": 23.86, "elapsed_time": "1:30:57", "remaining_time": "4:50:12"}
{"current_steps": 660, "total_steps": 2724, "loss": 0.4941, "learning_rate": 5e-06, "epoch": 0.7264722069345074, "percentage": 24.23, "elapsed_time": "1:32:21", "remaining_time": "4:48:49"}
{"current_steps": 670, "total_steps": 2724, "loss": 0.5, "learning_rate": 5e-06, "epoch": 0.7374793615850302, "percentage": 24.6, "elapsed_time": "1:33:45", "remaining_time": "4:47:25"}
{"current_steps": 680, "total_steps": 2724, "loss": 0.5022, "learning_rate": 5e-06, "epoch": 0.7484865162355531, "percentage": 24.96, "elapsed_time": "1:35:09", "remaining_time": "4:46:03"}
{"current_steps": 690, "total_steps": 2724, "loss": 0.4968, "learning_rate": 5e-06, "epoch": 0.759493670886076, "percentage": 25.33, "elapsed_time": "1:36:34", "remaining_time": "4:44:40"}
{"current_steps": 700, "total_steps": 2724, "loss": 0.4928, "learning_rate": 5e-06, "epoch": 0.7705008255365988, "percentage": 25.7, "elapsed_time": "1:37:58", "remaining_time": "4:43:17"}
{"current_steps": 710, "total_steps": 2724, "loss": 0.4898, "learning_rate": 5e-06, "epoch": 0.7815079801871216, "percentage": 26.06, "elapsed_time": "1:39:22", "remaining_time": "4:41:54"}
{"current_steps": 720, "total_steps": 2724, "loss": 0.4899, "learning_rate": 5e-06, "epoch": 0.7925151348376445, "percentage": 26.43, "elapsed_time": "1:40:47", "remaining_time": "4:40:31"}
{"current_steps": 730, "total_steps": 2724, "loss": 0.4883, "learning_rate": 5e-06, "epoch": 0.8035222894881673, "percentage": 26.8, "elapsed_time": "1:42:11", "remaining_time": "4:39:08"}
{"current_steps": 740, "total_steps": 2724, "loss": 0.4936, "learning_rate": 5e-06, "epoch": 0.8145294441386901, "percentage": 27.17, "elapsed_time": "1:43:36", "remaining_time": "4:37:45"}
{"current_steps": 750, "total_steps": 2724, "loss": 0.4895, "learning_rate": 5e-06, "epoch": 0.825536598789213, "percentage": 27.53, "elapsed_time": "1:45:00", "remaining_time": "4:36:22"}
{"current_steps": 760, "total_steps": 2724, "loss": 0.4791, "learning_rate": 5e-06, "epoch": 0.8365437534397359, "percentage": 27.9, "elapsed_time": "1:46:23", "remaining_time": "4:34:57"}
{"current_steps": 770, "total_steps": 2724, "loss": 0.492, "learning_rate": 5e-06, "epoch": 0.8475509080902587, "percentage": 28.27, "elapsed_time": "1:47:47", "remaining_time": "4:33:32"}
{"current_steps": 780, "total_steps": 2724, "loss": 0.4938, "learning_rate": 5e-06, "epoch": 0.8585580627407815, "percentage": 28.63, "elapsed_time": "1:49:11", "remaining_time": "4:32:07"}
{"current_steps": 790, "total_steps": 2724, "loss": 0.4914, "learning_rate": 5e-06, "epoch": 0.8695652173913043, "percentage": 29.0, "elapsed_time": "1:50:35", "remaining_time": "4:30:43"}
{"current_steps": 800, "total_steps": 2724, "loss": 0.4876, "learning_rate": 5e-06, "epoch": 0.8805723720418271, "percentage": 29.37, "elapsed_time": "1:51:58", "remaining_time": "4:29:18"}
{"current_steps": 810, "total_steps": 2724, "loss": 0.49, "learning_rate": 5e-06, "epoch": 0.8915795266923501, "percentage": 29.74, "elapsed_time": "1:53:21", "remaining_time": "4:27:52"}
{"current_steps": 820, "total_steps": 2724, "loss": 0.4873, "learning_rate": 5e-06, "epoch": 0.9025866813428729, "percentage": 30.1, "elapsed_time": "1:54:45", "remaining_time": "4:26:27"}
{"current_steps": 830, "total_steps": 2724, "loss": 0.4876, "learning_rate": 5e-06, "epoch": 0.9135938359933957, "percentage": 30.47, "elapsed_time": "1:56:08", "remaining_time": "4:25:02"}
{"current_steps": 840, "total_steps": 2724, "loss": 0.4835, "learning_rate": 5e-06, "epoch": 0.9246009906439185, "percentage": 30.84, "elapsed_time": "1:57:32", "remaining_time": "4:23:37"}
{"current_steps": 850, "total_steps": 2724, "loss": 0.4856, "learning_rate": 5e-06, "epoch": 0.9356081452944414, "percentage": 31.2, "elapsed_time": "1:58:55", "remaining_time": "4:22:12"}
{"current_steps": 860, "total_steps": 2724, "loss": 0.4893, "learning_rate": 5e-06, "epoch": 0.9466152999449642, "percentage": 31.57, "elapsed_time": "2:00:18", "remaining_time": "4:20:46"}
{"current_steps": 870, "total_steps": 2724, "loss": 0.4861, "learning_rate": 5e-06, "epoch": 0.9576224545954871, "percentage": 31.94, "elapsed_time": "2:01:42", "remaining_time": "4:19:21"}
{"current_steps": 880, "total_steps": 2724, "loss": 0.4866, "learning_rate": 5e-06, "epoch": 0.9686296092460099, "percentage": 32.31, "elapsed_time": "2:03:05", "remaining_time": "4:17:56"}
{"current_steps": 890, "total_steps": 2724, "loss": 0.4871, "learning_rate": 5e-06, "epoch": 0.9796367638965328, "percentage": 32.67, "elapsed_time": "2:04:29", "remaining_time": "4:16:31"}
{"current_steps": 900, "total_steps": 2724, "loss": 0.4817, "learning_rate": 5e-06, "epoch": 0.9906439185470556, "percentage": 33.04, "elapsed_time": "2:05:52", "remaining_time": "4:15:06"}
{"current_steps": 908, "total_steps": 2724, "eval_loss": 0.4857633411884308, "epoch": 0.9994496422674739, "percentage": 33.33, "elapsed_time": "2:09:41", "remaining_time": "4:19:23"}
{"current_steps": 910, "total_steps": 2724, "loss": 0.4812, "learning_rate": 5e-06, "epoch": 1.0016510731975785, "percentage": 33.41, "elapsed_time": "2:10:46", "remaining_time": "4:20:41"}
{"current_steps": 920, "total_steps": 2724, "loss": 0.4395, "learning_rate": 5e-06, "epoch": 1.0126582278481013, "percentage": 33.77, "elapsed_time": "2:12:09", "remaining_time": "4:19:08"}
{"current_steps": 930, "total_steps": 2724, "loss": 0.4379, "learning_rate": 5e-06, "epoch": 1.0236653824986242, "percentage": 34.14, "elapsed_time": "2:13:32", "remaining_time": "4:17:35"}
{"current_steps": 940, "total_steps": 2724, "loss": 0.4388, "learning_rate": 5e-06, "epoch": 1.034672537149147, "percentage": 34.51, "elapsed_time": "2:14:55", "remaining_time": "4:16:03"}
{"current_steps": 950, "total_steps": 2724, "loss": 0.4374, "learning_rate": 5e-06, "epoch": 1.0456796917996698, "percentage": 34.88, "elapsed_time": "2:16:18", "remaining_time": "4:14:32"}
{"current_steps": 960, "total_steps": 2724, "loss": 0.4358, "learning_rate": 5e-06, "epoch": 1.0566868464501926, "percentage": 35.24, "elapsed_time": "2:17:42", "remaining_time": "4:13:01"}
{"current_steps": 970, "total_steps": 2724, "loss": 0.4359, "learning_rate": 5e-06, "epoch": 1.0676940011007154, "percentage": 35.61, "elapsed_time": "2:19:05", "remaining_time": "4:11:31"}
{"current_steps": 980, "total_steps": 2724, "loss": 0.4383, "learning_rate": 5e-06, "epoch": 1.0787011557512383, "percentage": 35.98, "elapsed_time": "2:20:29", "remaining_time": "4:10:01"}
{"current_steps": 990, "total_steps": 2724, "loss": 0.4385, "learning_rate": 5e-06, "epoch": 1.089708310401761, "percentage": 36.34, "elapsed_time": "2:21:53", "remaining_time": "4:08:30"}
{"current_steps": 1000, "total_steps": 2724, "loss": 0.4405, "learning_rate": 5e-06, "epoch": 1.100715465052284, "percentage": 36.71, "elapsed_time": "2:23:16", "remaining_time": "4:07:00"}
{"current_steps": 1010, "total_steps": 2724, "loss": 0.4371, "learning_rate": 5e-06, "epoch": 1.1117226197028067, "percentage": 37.08, "elapsed_time": "2:24:39", "remaining_time": "4:05:29"}
{"current_steps": 1020, "total_steps": 2724, "loss": 0.4345, "learning_rate": 5e-06, "epoch": 1.1227297743533298, "percentage": 37.44, "elapsed_time": "2:26:02", "remaining_time": "4:03:58"}
{"current_steps": 1030, "total_steps": 2724, "loss": 0.4405, "learning_rate": 5e-06, "epoch": 1.1337369290038526, "percentage": 37.81, "elapsed_time": "2:27:25", "remaining_time": "4:02:28"}
{"current_steps": 1040, "total_steps": 2724, "loss": 0.4381, "learning_rate": 5e-06, "epoch": 1.1447440836543754, "percentage": 38.18, "elapsed_time": "2:28:49", "remaining_time": "4:00:58"}
{"current_steps": 1050, "total_steps": 2724, "loss": 0.4387, "learning_rate": 5e-06, "epoch": 1.1557512383048982, "percentage": 38.55, "elapsed_time": "2:30:12", "remaining_time": "3:59:28"}
{"current_steps": 1060, "total_steps": 2724, "loss": 0.4422, "learning_rate": 5e-06, "epoch": 1.166758392955421, "percentage": 38.91, "elapsed_time": "2:31:35", "remaining_time": "3:57:58"}
{"current_steps": 1070, "total_steps": 2724, "loss": 0.4341, "learning_rate": 5e-06, "epoch": 1.1777655476059439, "percentage": 39.28, "elapsed_time": "2:32:59", "remaining_time": "3:56:29"}
{"current_steps": 1080, "total_steps": 2724, "loss": 0.4353, "learning_rate": 5e-06, "epoch": 1.1887727022564667, "percentage": 39.65, "elapsed_time": "2:34:22", "remaining_time": "3:55:00"}
{"current_steps": 1090, "total_steps": 2724, "loss": 0.4425, "learning_rate": 5e-06, "epoch": 1.1997798569069895, "percentage": 40.01, "elapsed_time": "2:35:46", "remaining_time": "3:53:31"}
{"current_steps": 1100, "total_steps": 2724, "loss": 0.4376, "learning_rate": 5e-06, "epoch": 1.2107870115575123, "percentage": 40.38, "elapsed_time": "2:37:09", "remaining_time": "3:52:01"}
{"current_steps": 1110, "total_steps": 2724, "loss": 0.4323, "learning_rate": 5e-06, "epoch": 1.2217941662080352, "percentage": 40.75, "elapsed_time": "2:38:33", "remaining_time": "3:50:33"}
{"current_steps": 1120, "total_steps": 2724, "loss": 0.4394, "learning_rate": 5e-06, "epoch": 1.232801320858558, "percentage": 41.12, "elapsed_time": "2:39:57", "remaining_time": "3:49:04"}
{"current_steps": 1130, "total_steps": 2724, "loss": 0.4395, "learning_rate": 5e-06, "epoch": 1.243808475509081, "percentage": 41.48, "elapsed_time": "2:41:20", "remaining_time": "3:47:36"}
{"current_steps": 1140, "total_steps": 2724, "loss": 0.4361, "learning_rate": 5e-06, "epoch": 1.2548156301596038, "percentage": 41.85, "elapsed_time": "2:42:44", "remaining_time": "3:46:07"}
{"current_steps": 1150, "total_steps": 2724, "loss": 0.4359, "learning_rate": 5e-06, "epoch": 1.2658227848101267, "percentage": 42.22, "elapsed_time": "2:44:07", "remaining_time": "3:44:38"}
{"current_steps": 1160, "total_steps": 2724, "loss": 0.4381, "learning_rate": 5e-06, "epoch": 1.2768299394606495, "percentage": 42.58, "elapsed_time": "2:45:31", "remaining_time": "3:43:09"}
{"current_steps": 1170, "total_steps": 2724, "loss": 0.4375, "learning_rate": 5e-06, "epoch": 1.2878370941111723, "percentage": 42.95, "elapsed_time": "2:46:54", "remaining_time": "3:41:41"}
{"current_steps": 1180, "total_steps": 2724, "loss": 0.44, "learning_rate": 5e-06, "epoch": 1.2988442487616951, "percentage": 43.32, "elapsed_time": "2:48:17", "remaining_time": "3:40:12"}
{"current_steps": 1190, "total_steps": 2724, "loss": 0.4321, "learning_rate": 5e-06, "epoch": 1.309851403412218, "percentage": 43.69, "elapsed_time": "2:49:41", "remaining_time": "3:38:44"}
{"current_steps": 1200, "total_steps": 2724, "loss": 0.4391, "learning_rate": 5e-06, "epoch": 1.3208585580627408, "percentage": 44.05, "elapsed_time": "2:51:04", "remaining_time": "3:37:16"}
{"current_steps": 1210, "total_steps": 2724, "loss": 0.4299, "learning_rate": 5e-06, "epoch": 1.3318657127132636, "percentage": 44.42, "elapsed_time": "2:52:28", "remaining_time": "3:35:47"}
{"current_steps": 1220, "total_steps": 2724, "loss": 0.4401, "learning_rate": 5e-06, "epoch": 1.3428728673637864, "percentage": 44.79, "elapsed_time": "2:53:51", "remaining_time": "3:34:19"}
{"current_steps": 1230, "total_steps": 2724, "loss": 0.4368, "learning_rate": 5e-06, "epoch": 1.3538800220143092, "percentage": 45.15, "elapsed_time": "2:55:14", "remaining_time": "3:32:51"}
{"current_steps": 1240, "total_steps": 2724, "loss": 0.4382, "learning_rate": 5e-06, "epoch": 1.364887176664832, "percentage": 45.52, "elapsed_time": "2:56:38", "remaining_time": "3:31:24"}
{"current_steps": 1250, "total_steps": 2724, "loss": 0.4418, "learning_rate": 5e-06, "epoch": 1.3758943313153549, "percentage": 45.89, "elapsed_time": "2:58:02", "remaining_time": "3:29:56"}
{"current_steps": 1260, "total_steps": 2724, "loss": 0.4402, "learning_rate": 5e-06, "epoch": 1.3869014859658777, "percentage": 46.26, "elapsed_time": "2:59:26", "remaining_time": "3:28:30"}
{"current_steps": 1270, "total_steps": 2724, "loss": 0.4384, "learning_rate": 5e-06, "epoch": 1.3979086406164005, "percentage": 46.62, "elapsed_time": "3:00:51", "remaining_time": "3:27:03"}
{"current_steps": 1280, "total_steps": 2724, "loss": 0.4358, "learning_rate": 5e-06, "epoch": 1.4089157952669236, "percentage": 46.99, "elapsed_time": "3:02:14", "remaining_time": "3:25:35"}
{"current_steps": 1290, "total_steps": 2724, "loss": 0.4366, "learning_rate": 5e-06, "epoch": 1.4199229499174464, "percentage": 47.36, "elapsed_time": "3:03:38", "remaining_time": "3:24:08"}
{"current_steps": 1300, "total_steps": 2724, "loss": 0.4333, "learning_rate": 5e-06, "epoch": 1.4309301045679692, "percentage": 47.72, "elapsed_time": "3:05:02", "remaining_time": "3:22:41"}
{"current_steps": 1310, "total_steps": 2724, "loss": 0.4307, "learning_rate": 5e-06, "epoch": 1.441937259218492, "percentage": 48.09, "elapsed_time": "3:06:26", "remaining_time": "3:21:14"}
{"current_steps": 1320, "total_steps": 2724, "loss": 0.4375, "learning_rate": 5e-06, "epoch": 1.4529444138690149, "percentage": 48.46, "elapsed_time": "3:07:49", "remaining_time": "3:19:46"}
{"current_steps": 1330, "total_steps": 2724, "loss": 0.4318, "learning_rate": 5e-06, "epoch": 1.4639515685195377, "percentage": 48.83, "elapsed_time": "3:09:13", "remaining_time": "3:18:19"}
{"current_steps": 1340, "total_steps": 2724, "loss": 0.4395, "learning_rate": 5e-06, "epoch": 1.4749587231700605, "percentage": 49.19, "elapsed_time": "3:10:36", "remaining_time": "3:16:52"}
{"current_steps": 1350, "total_steps": 2724, "loss": 0.4343, "learning_rate": 5e-06, "epoch": 1.4859658778205833, "percentage": 49.56, "elapsed_time": "3:12:00", "remaining_time": "3:15:25"}
{"current_steps": 1360, "total_steps": 2724, "loss": 0.4358, "learning_rate": 5e-06, "epoch": 1.4969730324711064, "percentage": 49.93, "elapsed_time": "3:13:24", "remaining_time": "3:13:58"}
{"current_steps": 1370, "total_steps": 2724, "loss": 0.4365, "learning_rate": 5e-06, "epoch": 1.5079801871216292, "percentage": 50.29, "elapsed_time": "3:14:47", "remaining_time": "3:12:30"}
{"current_steps": 1380, "total_steps": 2724, "loss": 0.4387, "learning_rate": 5e-06, "epoch": 1.518987341772152, "percentage": 50.66, "elapsed_time": "3:16:10", "remaining_time": "3:11:03"}
{"current_steps": 1390, "total_steps": 2724, "loss": 0.4275, "learning_rate": 5e-06, "epoch": 1.5299944964226748, "percentage": 51.03, "elapsed_time": "3:17:34", "remaining_time": "3:09:37"}
{"current_steps": 1400, "total_steps": 2724, "loss": 0.4302, "learning_rate": 5e-06, "epoch": 1.5410016510731976, "percentage": 51.4, "elapsed_time": "3:18:59", "remaining_time": "3:08:10"}
{"current_steps": 1410, "total_steps": 2724, "loss": 0.4344, "learning_rate": 5e-06, "epoch": 1.5520088057237205, "percentage": 51.76, "elapsed_time": "3:20:23", "remaining_time": "3:06:44"}
{"current_steps": 1420, "total_steps": 2724, "loss": 0.4366, "learning_rate": 5e-06, "epoch": 1.5630159603742433, "percentage": 52.13, "elapsed_time": "3:21:47", "remaining_time": "3:05:18"}
{"current_steps": 1430, "total_steps": 2724, "loss": 0.4353, "learning_rate": 5e-06, "epoch": 1.574023115024766, "percentage": 52.5, "elapsed_time": "3:23:11", "remaining_time": "3:03:51"}
{"current_steps": 1440, "total_steps": 2724, "loss": 0.4332, "learning_rate": 5e-06, "epoch": 1.585030269675289, "percentage": 52.86, "elapsed_time": "3:24:35", "remaining_time": "3:02:25"}
{"current_steps": 1450, "total_steps": 2724, "loss": 0.4297, "learning_rate": 5e-06, "epoch": 1.5960374243258117, "percentage": 53.23, "elapsed_time": "3:25:59", "remaining_time": "3:00:59"}
{"current_steps": 1460, "total_steps": 2724, "loss": 0.4369, "learning_rate": 5e-06, "epoch": 1.6070445789763346, "percentage": 53.6, "elapsed_time": "3:27:23", "remaining_time": "2:59:33"}
{"current_steps": 1470, "total_steps": 2724, "loss": 0.4364, "learning_rate": 5e-06, "epoch": 1.6180517336268574, "percentage": 53.96, "elapsed_time": "3:28:47", "remaining_time": "2:58:06"}
{"current_steps": 1480, "total_steps": 2724, "loss": 0.4313, "learning_rate": 5e-06, "epoch": 1.6290588882773802, "percentage": 54.33, "elapsed_time": "3:30:11", "remaining_time": "2:56:40"}
{"current_steps": 1490, "total_steps": 2724, "loss": 0.4314, "learning_rate": 5e-06, "epoch": 1.640066042927903, "percentage": 54.7, "elapsed_time": "3:31:35", "remaining_time": "2:55:14"}
{"current_steps": 1500, "total_steps": 2724, "loss": 0.4334, "learning_rate": 5e-06, "epoch": 1.6510731975784259, "percentage": 55.07, "elapsed_time": "3:32:59", "remaining_time": "2:53:48"}
{"current_steps": 1510, "total_steps": 2724, "loss": 0.4332, "learning_rate": 5e-06, "epoch": 1.6620803522289487, "percentage": 55.43, "elapsed_time": "3:34:23", "remaining_time": "2:52:21"}
{"current_steps": 1520, "total_steps": 2724, "loss": 0.4326, "learning_rate": 5e-06, "epoch": 1.6730875068794715, "percentage": 55.8, "elapsed_time": "3:35:46", "remaining_time": "2:50:55"}
{"current_steps": 1530, "total_steps": 2724, "loss": 0.4366, "learning_rate": 5e-06, "epoch": 1.6840946615299945, "percentage": 56.17, "elapsed_time": "3:37:10", "remaining_time": "2:49:28"}
{"current_steps": 1540, "total_steps": 2724, "loss": 0.4316, "learning_rate": 5e-06, "epoch": 1.6951018161805174, "percentage": 56.53, "elapsed_time": "3:38:36", "remaining_time": "2:48:04"}
{"current_steps": 1550, "total_steps": 2724, "loss": 0.431, "learning_rate": 5e-06, "epoch": 1.7061089708310402, "percentage": 56.9, "elapsed_time": "3:39:59", "remaining_time": "2:46:37"}
{"current_steps": 1560, "total_steps": 2724, "loss": 0.4359, "learning_rate": 5e-06, "epoch": 1.717116125481563, "percentage": 57.27, "elapsed_time": "3:41:22", "remaining_time": "2:45:10"}
{"current_steps": 1570, "total_steps": 2724, "loss": 0.4332, "learning_rate": 5e-06, "epoch": 1.7281232801320858, "percentage": 57.64, "elapsed_time": "3:42:44", "remaining_time": "2:43:43"}
{"current_steps": 1580, "total_steps": 2724, "loss": 0.4295, "learning_rate": 5e-06, "epoch": 1.7391304347826086, "percentage": 58.0, "elapsed_time": "3:44:07", "remaining_time": "2:42:16"}
{"current_steps": 1590, "total_steps": 2724, "loss": 0.4366, "learning_rate": 5e-06, "epoch": 1.7501375894331317, "percentage": 58.37, "elapsed_time": "3:45:31", "remaining_time": "2:40:50"}
{"current_steps": 1600, "total_steps": 2724, "loss": 0.4298, "learning_rate": 5e-06, "epoch": 1.7611447440836545, "percentage": 58.74, "elapsed_time": "3:46:54", "remaining_time": "2:39:24"}
{"current_steps": 1610, "total_steps": 2724, "loss": 0.43, "learning_rate": 5e-06, "epoch": 1.7721518987341773, "percentage": 59.1, "elapsed_time": "3:48:18", "remaining_time": "2:37:58"}
{"current_steps": 1620, "total_steps": 2724, "loss": 0.43, "learning_rate": 5e-06, "epoch": 1.7831590533847002, "percentage": 59.47, "elapsed_time": "3:49:41", "remaining_time": "2:36:32"}
{"current_steps": 1630, "total_steps": 2724, "loss": 0.432, "learning_rate": 5e-06, "epoch": 1.794166208035223, "percentage": 59.84, "elapsed_time": "3:51:05", "remaining_time": "2:35:06"}
{"current_steps": 1640, "total_steps": 2724, "loss": 0.4339, "learning_rate": 5e-06, "epoch": 1.8051733626857458, "percentage": 60.21, "elapsed_time": "3:52:28", "remaining_time": "2:33:39"}
{"current_steps": 1650, "total_steps": 2724, "loss": 0.4372, "learning_rate": 5e-06, "epoch": 1.8161805173362686, "percentage": 60.57, "elapsed_time": "3:53:51", "remaining_time": "2:32:13"}
{"current_steps": 1660, "total_steps": 2724, "loss": 0.4374, "learning_rate": 5e-06, "epoch": 1.8271876719867914, "percentage": 60.94, "elapsed_time": "3:55:15", "remaining_time": "2:30:47"}
{"current_steps": 1670, "total_steps": 2724, "loss": 0.4271, "learning_rate": 5e-06, "epoch": 1.8381948266373143, "percentage": 61.31, "elapsed_time": "3:56:38", "remaining_time": "2:29:21"}
{"current_steps": 1680, "total_steps": 2724, "loss": 0.4297, "learning_rate": 5e-06, "epoch": 1.849201981287837, "percentage": 61.67, "elapsed_time": "3:58:01", "remaining_time": "2:27:55"}
{"current_steps": 1690, "total_steps": 2724, "loss": 0.436, "learning_rate": 5e-06, "epoch": 1.86020913593836, "percentage": 62.04, "elapsed_time": "3:59:25", "remaining_time": "2:26:29"}
{"current_steps": 1700, "total_steps": 2724, "loss": 0.4381, "learning_rate": 5e-06, "epoch": 1.8712162905888827, "percentage": 62.41, "elapsed_time": "4:00:48", "remaining_time": "2:25:03"}
{"current_steps": 1710, "total_steps": 2724, "loss": 0.4315, "learning_rate": 5e-06, "epoch": 1.8822234452394055, "percentage": 62.78, "elapsed_time": "4:02:12", "remaining_time": "2:23:37"}
{"current_steps": 1720, "total_steps": 2724, "loss": 0.4337, "learning_rate": 5e-06, "epoch": 1.8932305998899284, "percentage": 63.14, "elapsed_time": "4:03:35", "remaining_time": "2:22:11"}
{"current_steps": 1730, "total_steps": 2724, "loss": 0.4297, "learning_rate": 5e-06, "epoch": 1.9042377545404512, "percentage": 63.51, "elapsed_time": "4:04:59", "remaining_time": "2:20:45"}
{"current_steps": 1740, "total_steps": 2724, "loss": 0.4307, "learning_rate": 5e-06, "epoch": 1.915244909190974, "percentage": 63.88, "elapsed_time": "4:06:22", "remaining_time": "2:19:20"}
{"current_steps": 1750, "total_steps": 2724, "loss": 0.4295, "learning_rate": 5e-06, "epoch": 1.9262520638414968, "percentage": 64.24, "elapsed_time": "4:07:46", "remaining_time": "2:17:54"}
{"current_steps": 1760, "total_steps": 2724, "loss": 0.4276, "learning_rate": 5e-06, "epoch": 1.9372592184920197, "percentage": 64.61, "elapsed_time": "4:09:09", "remaining_time": "2:16:28"}
{"current_steps": 1770, "total_steps": 2724, "loss": 0.4306, "learning_rate": 5e-06, "epoch": 1.9482663731425427, "percentage": 64.98, "elapsed_time": "4:10:33", "remaining_time": "2:15:02"}
{"current_steps": 1780, "total_steps": 2724, "loss": 0.428, "learning_rate": 5e-06, "epoch": 1.9592735277930655, "percentage": 65.35, "elapsed_time": "4:11:56", "remaining_time": "2:13:37"}
{"current_steps": 1790, "total_steps": 2724, "loss": 0.4303, "learning_rate": 5e-06, "epoch": 1.9702806824435883, "percentage": 65.71, "elapsed_time": "4:13:20", "remaining_time": "2:12:11"}
{"current_steps": 1800, "total_steps": 2724, "loss": 0.4295, "learning_rate": 5e-06, "epoch": 1.9812878370941112, "percentage": 66.08, "elapsed_time": "4:14:44", "remaining_time": "2:10:46"}
{"current_steps": 1810, "total_steps": 2724, "loss": 0.4298, "learning_rate": 5e-06, "epoch": 1.992294991744634, "percentage": 66.45, "elapsed_time": "4:16:07", "remaining_time": "2:09:20"}
{"current_steps": 1817, "total_steps": 2724, "eval_loss": 0.4725576341152191, "epoch": 2.0, "percentage": 66.7, "elapsed_time": "4:19:46", "remaining_time": "2:09:40"}
{"current_steps": 1820, "total_steps": 2724, "loss": 0.4167, "learning_rate": 5e-06, "epoch": 2.003302146395157, "percentage": 66.81, "elapsed_time": "4:21:11", "remaining_time": "2:09:43"}
{"current_steps": 1830, "total_steps": 2724, "loss": 0.3791, "learning_rate": 5e-06, "epoch": 2.01430930104568, "percentage": 67.18, "elapsed_time": "4:22:33", "remaining_time": "2:08:16"}