{"current_steps": 10, "total_steps": 825, "loss": 1.0337, "learning_rate": 5e-06, "epoch": 0.03636363636363636, "percentage": 1.21, "elapsed_time": "0:00:59", "remaining_time": "1:20:44"} {"current_steps": 20, "total_steps": 825, "loss": 0.9092, "learning_rate": 5e-06, "epoch": 0.07272727272727272, "percentage": 2.42, "elapsed_time": "0:01:58", "remaining_time": "1:19:24"} {"current_steps": 30, "total_steps": 825, "loss": 0.8658, "learning_rate": 5e-06, "epoch": 0.10909090909090909, "percentage": 3.64, "elapsed_time": "0:02:57", "remaining_time": "1:18:26"} {"current_steps": 40, "total_steps": 825, "loss": 0.844, "learning_rate": 5e-06, "epoch": 0.14545454545454545, "percentage": 4.85, "elapsed_time": "0:03:57", "remaining_time": "1:17:36"} {"current_steps": 50, "total_steps": 825, "loss": 0.8249, "learning_rate": 5e-06, "epoch": 0.18181818181818182, "percentage": 6.06, "elapsed_time": "0:04:56", "remaining_time": "1:16:38"} {"current_steps": 60, "total_steps": 825, "loss": 0.8068, "learning_rate": 5e-06, "epoch": 0.21818181818181817, "percentage": 7.27, "elapsed_time": "0:05:56", "remaining_time": "1:15:40"} {"current_steps": 70, "total_steps": 825, "loss": 0.7989, "learning_rate": 5e-06, "epoch": 0.2545454545454545, "percentage": 8.48, "elapsed_time": "0:06:55", "remaining_time": "1:14:40"} {"current_steps": 80, "total_steps": 825, "loss": 0.7921, "learning_rate": 5e-06, "epoch": 0.2909090909090909, "percentage": 9.7, "elapsed_time": "0:07:54", "remaining_time": "1:13:40"} {"current_steps": 90, "total_steps": 825, "loss": 0.781, "learning_rate": 5e-06, "epoch": 0.32727272727272727, "percentage": 10.91, "elapsed_time": "0:08:54", "remaining_time": "1:12:41"} {"current_steps": 100, "total_steps": 825, "loss": 0.7745, "learning_rate": 5e-06, "epoch": 0.36363636363636365, "percentage": 12.12, "elapsed_time": "0:09:53", "remaining_time": "1:11:43"} {"current_steps": 110, "total_steps": 825, "loss": 0.7754, "learning_rate": 5e-06, "epoch": 0.4, "percentage": 13.33, "elapsed_time": "0:10:53", "remaining_time": "1:10:46"} {"current_steps": 120, "total_steps": 825, "loss": 0.772, "learning_rate": 5e-06, "epoch": 0.43636363636363634, "percentage": 14.55, "elapsed_time": "0:11:53", "remaining_time": "1:09:53"} {"current_steps": 130, "total_steps": 825, "loss": 0.7686, "learning_rate": 5e-06, "epoch": 0.4727272727272727, "percentage": 15.76, "elapsed_time": "0:12:53", "remaining_time": "1:08:55"} {"current_steps": 140, "total_steps": 825, "loss": 0.7618, "learning_rate": 5e-06, "epoch": 0.509090909090909, "percentage": 16.97, "elapsed_time": "0:13:53", "remaining_time": "1:07:57"} {"current_steps": 150, "total_steps": 825, "loss": 0.7611, "learning_rate": 5e-06, "epoch": 0.5454545454545454, "percentage": 18.18, "elapsed_time": "0:14:52", "remaining_time": "1:06:57"} {"current_steps": 160, "total_steps": 825, "loss": 0.7569, "learning_rate": 5e-06, "epoch": 0.5818181818181818, "percentage": 19.39, "elapsed_time": "0:15:52", "remaining_time": "1:05:57"} {"current_steps": 170, "total_steps": 825, "loss": 0.7611, "learning_rate": 5e-06, "epoch": 0.6181818181818182, "percentage": 20.61, "elapsed_time": "0:16:52", "remaining_time": "1:04:59"} {"current_steps": 180, "total_steps": 825, "loss": 0.7546, "learning_rate": 5e-06, "epoch": 0.6545454545454545, "percentage": 21.82, "elapsed_time": "0:17:51", "remaining_time": "1:03:59"} {"current_steps": 190, "total_steps": 825, "loss": 0.7566, "learning_rate": 5e-06, "epoch": 0.6909090909090909, "percentage": 23.03, "elapsed_time": "0:18:50", "remaining_time": "1:02:58"} {"current_steps": 200, "total_steps": 825, "loss": 0.75, "learning_rate": 5e-06, "epoch": 0.7272727272727273, "percentage": 24.24, "elapsed_time": "0:19:49", "remaining_time": "1:01:57"} {"current_steps": 210, "total_steps": 825, "loss": 0.7476, "learning_rate": 5e-06, "epoch": 0.7636363636363637, "percentage": 25.45, "elapsed_time": "0:20:49", "remaining_time": "1:00:58"} {"current_steps": 220, "total_steps": 825, "loss": 0.7462, "learning_rate": 5e-06, "epoch": 0.8, "percentage": 26.67, "elapsed_time": "0:21:48", "remaining_time": "0:59:59"} {"current_steps": 230, "total_steps": 825, "loss": 0.7411, "learning_rate": 5e-06, "epoch": 0.8363636363636363, "percentage": 27.88, "elapsed_time": "0:22:48", "remaining_time": "0:59:00"} {"current_steps": 240, "total_steps": 825, "loss": 0.7469, "learning_rate": 5e-06, "epoch": 0.8727272727272727, "percentage": 29.09, "elapsed_time": "0:23:47", "remaining_time": "0:58:00"} {"current_steps": 250, "total_steps": 825, "loss": 0.7378, "learning_rate": 5e-06, "epoch": 0.9090909090909091, "percentage": 30.3, "elapsed_time": "0:24:47", "remaining_time": "0:57:00"} {"current_steps": 260, "total_steps": 825, "loss": 0.7457, "learning_rate": 5e-06, "epoch": 0.9454545454545454, "percentage": 31.52, "elapsed_time": "0:25:46", "remaining_time": "0:56:01"} {"current_steps": 270, "total_steps": 825, "loss": 0.7466, "learning_rate": 5e-06, "epoch": 0.9818181818181818, "percentage": 32.73, "elapsed_time": "0:26:46", "remaining_time": "0:55:01"} {"current_steps": 275, "total_steps": 825, "eval_loss": 0.7417545914649963, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "0:27:42", "remaining_time": "0:55:24"} {"current_steps": 280, "total_steps": 825, "loss": 0.7136, "learning_rate": 5e-06, "epoch": 1.018181818181818, "percentage": 33.94, "elapsed_time": "0:29:40", "remaining_time": "0:57:45"} {"current_steps": 290, "total_steps": 825, "loss": 0.6871, "learning_rate": 5e-06, "epoch": 1.0545454545454545, "percentage": 35.15, "elapsed_time": "0:30:39", "remaining_time": "0:56:34"} {"current_steps": 300, "total_steps": 825, "loss": 0.6894, "learning_rate": 5e-06, "epoch": 1.0909090909090908, "percentage": 36.36, "elapsed_time": "0:31:39", "remaining_time": "0:55:24"} {"current_steps": 310, "total_steps": 825, "loss": 0.6935, "learning_rate": 5e-06, "epoch": 1.1272727272727272, "percentage": 37.58, "elapsed_time": "0:32:38", "remaining_time": "0:54:13"} {"current_steps": 320, "total_steps": 825, "loss": 0.6945, "learning_rate": 5e-06, "epoch": 1.1636363636363636, "percentage": 38.79, "elapsed_time": "0:33:38", "remaining_time": "0:53:04"} {"current_steps": 330, "total_steps": 825, "loss": 0.6886, "learning_rate": 5e-06, "epoch": 1.2, "percentage": 40.0, "elapsed_time": "0:34:36", "remaining_time": "0:51:55"} {"current_steps": 340, "total_steps": 825, "loss": 0.6898, "learning_rate": 5e-06, "epoch": 1.2363636363636363, "percentage": 41.21, "elapsed_time": "0:35:36", "remaining_time": "0:50:47"} {"current_steps": 350, "total_steps": 825, "loss": 0.6934, "learning_rate": 5e-06, "epoch": 1.2727272727272727, "percentage": 42.42, "elapsed_time": "0:36:36", "remaining_time": "0:49:41"} {"current_steps": 360, "total_steps": 825, "loss": 0.6922, "learning_rate": 5e-06, "epoch": 1.309090909090909, "percentage": 43.64, "elapsed_time": "0:37:35", "remaining_time": "0:48:33"} {"current_steps": 370, "total_steps": 825, "loss": 0.6912, "learning_rate": 5e-06, "epoch": 1.3454545454545455, "percentage": 44.85, "elapsed_time": "0:38:34", "remaining_time": "0:47:26"} {"current_steps": 380, "total_steps": 825, "loss": 0.6904, "learning_rate": 5e-06, "epoch": 1.3818181818181818, "percentage": 46.06, "elapsed_time": "0:39:34", "remaining_time": "0:46:20"} {"current_steps": 390, "total_steps": 825, "loss": 0.688, "learning_rate": 5e-06, "epoch": 1.4181818181818182, "percentage": 47.27, "elapsed_time": "0:40:33", "remaining_time": "0:45:14"} {"current_steps": 400, "total_steps": 825, "loss": 0.6883, "learning_rate": 5e-06, "epoch": 1.4545454545454546, "percentage": 48.48, "elapsed_time": "0:41:33", "remaining_time": "0:44:08"} {"current_steps": 410, "total_steps": 825, "loss": 0.6934, "learning_rate": 5e-06, "epoch": 1.490909090909091, "percentage": 49.7, "elapsed_time": "0:42:32", "remaining_time": "0:43:03"} {"current_steps": 420, "total_steps": 825, "loss": 0.6916, "learning_rate": 5e-06, "epoch": 1.5272727272727273, "percentage": 50.91, "elapsed_time": "0:43:31", "remaining_time": "0:41:57"} {"current_steps": 430, "total_steps": 825, "loss": 0.6916, "learning_rate": 5e-06, "epoch": 1.5636363636363635, "percentage": 52.12, "elapsed_time": "0:44:30", "remaining_time": "0:40:52"} {"current_steps": 440, "total_steps": 825, "loss": 0.6856, "learning_rate": 5e-06, "epoch": 1.6, "percentage": 53.33, "elapsed_time": "0:45:29", "remaining_time": "0:39:47"} {"current_steps": 450, "total_steps": 825, "loss": 0.6851, "learning_rate": 5e-06, "epoch": 1.6363636363636362, "percentage": 54.55, "elapsed_time": "0:46:28", "remaining_time": "0:38:43"} {"current_steps": 460, "total_steps": 825, "loss": 0.6872, "learning_rate": 5e-06, "epoch": 1.6727272727272728, "percentage": 55.76, "elapsed_time": "0:47:27", "remaining_time": "0:37:39"} {"current_steps": 470, "total_steps": 825, "loss": 0.6849, "learning_rate": 5e-06, "epoch": 1.709090909090909, "percentage": 56.97, "elapsed_time": "0:48:26", "remaining_time": "0:36:35"} {"current_steps": 480, "total_steps": 825, "loss": 0.6891, "learning_rate": 5e-06, "epoch": 1.7454545454545456, "percentage": 58.18, "elapsed_time": "0:49:26", "remaining_time": "0:35:31"} {"current_steps": 490, "total_steps": 825, "loss": 0.6847, "learning_rate": 5e-06, "epoch": 1.7818181818181817, "percentage": 59.39, "elapsed_time": "0:50:25", "remaining_time": "0:34:28"} {"current_steps": 500, "total_steps": 825, "loss": 0.6871, "learning_rate": 5e-06, "epoch": 1.8181818181818183, "percentage": 60.61, "elapsed_time": "0:51:24", "remaining_time": "0:33:24"} {"current_steps": 510, "total_steps": 825, "loss": 0.6888, "learning_rate": 5e-06, "epoch": 1.8545454545454545, "percentage": 61.82, "elapsed_time": "0:52:24", "remaining_time": "0:32:22"} {"current_steps": 520, "total_steps": 825, "loss": 0.6884, "learning_rate": 5e-06, "epoch": 1.8909090909090909, "percentage": 63.03, "elapsed_time": "0:53:23", "remaining_time": "0:31:19"} {"current_steps": 530, "total_steps": 825, "loss": 0.6893, "learning_rate": 5e-06, "epoch": 1.9272727272727272, "percentage": 64.24, "elapsed_time": "0:54:23", "remaining_time": "0:30:16"} {"current_steps": 540, "total_steps": 825, "loss": 0.6868, "learning_rate": 5e-06, "epoch": 1.9636363636363636, "percentage": 65.45, "elapsed_time": "0:55:22", "remaining_time": "0:29:13"} {"current_steps": 550, "total_steps": 825, "loss": 0.6841, "learning_rate": 5e-06, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "0:56:21", "remaining_time": "0:28:10"} {"current_steps": 550, "total_steps": 825, "eval_loss": 0.7281343340873718, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "0:56:48", "remaining_time": "0:28:24"} {"current_steps": 560, "total_steps": 825, "loss": 0.6351, "learning_rate": 5e-06, "epoch": 2.036363636363636, "percentage": 67.88, "elapsed_time": "0:59:27", "remaining_time": "0:28:08"} {"current_steps": 570, "total_steps": 825, "loss": 0.6307, "learning_rate": 5e-06, "epoch": 2.0727272727272728, "percentage": 69.09, "elapsed_time": "1:00:26", "remaining_time": "0:27:02"} {"current_steps": 580, "total_steps": 825, "loss": 0.6357, "learning_rate": 5e-06, "epoch": 2.109090909090909, "percentage": 70.3, "elapsed_time": "1:01:25", "remaining_time": "0:25:56"} {"current_steps": 590, "total_steps": 825, "loss": 0.6375, "learning_rate": 5e-06, "epoch": 2.1454545454545455, "percentage": 71.52, "elapsed_time": "1:02:24", "remaining_time": "0:24:51"} {"current_steps": 600, "total_steps": 825, "loss": 0.635, "learning_rate": 5e-06, "epoch": 2.1818181818181817, "percentage": 72.73, "elapsed_time": "1:03:23", "remaining_time": "0:23:46"} {"current_steps": 610, "total_steps": 825, "loss": 0.6383, "learning_rate": 5e-06, "epoch": 2.2181818181818183, "percentage": 73.94, "elapsed_time": "1:04:22", "remaining_time": "0:22:41"} {"current_steps": 620, "total_steps": 825, "loss": 0.6321, "learning_rate": 5e-06, "epoch": 2.2545454545454544, "percentage": 75.15, "elapsed_time": "1:05:21", "remaining_time": "0:21:36"} {"current_steps": 630, "total_steps": 825, "loss": 0.6341, "learning_rate": 5e-06, "epoch": 2.290909090909091, "percentage": 76.36, "elapsed_time": "1:06:21", "remaining_time": "0:20:32"} {"current_steps": 640, "total_steps": 825, "loss": 0.6326, "learning_rate": 5e-06, "epoch": 2.327272727272727, "percentage": 77.58, "elapsed_time": "1:07:20", "remaining_time": "0:19:27"} {"current_steps": 650, "total_steps": 825, "loss": 0.6385, "learning_rate": 5e-06, "epoch": 2.3636363636363638, "percentage": 78.79, "elapsed_time": "1:08:19", "remaining_time": "0:18:23"} {"current_steps": 660, "total_steps": 825, "loss": 0.6373, "learning_rate": 5e-06, "epoch": 2.4, "percentage": 80.0, "elapsed_time": "1:09:19", "remaining_time": "0:17:19"} {"current_steps": 670, "total_steps": 825, "loss": 0.6399, "learning_rate": 5e-06, "epoch": 2.4363636363636365, "percentage": 81.21, "elapsed_time": "1:10:17", "remaining_time": "0:16:15"} {"current_steps": 680, "total_steps": 825, "loss": 0.6393, "learning_rate": 5e-06, "epoch": 2.4727272727272727, "percentage": 82.42, "elapsed_time": "1:11:16", "remaining_time": "0:15:11"} {"current_steps": 690, "total_steps": 825, "loss": 0.6405, "learning_rate": 5e-06, "epoch": 2.509090909090909, "percentage": 83.64, "elapsed_time": "1:12:15", "remaining_time": "0:14:08"} {"current_steps": 700, "total_steps": 825, "loss": 0.6385, "learning_rate": 5e-06, "epoch": 2.5454545454545454, "percentage": 84.85, "elapsed_time": "1:13:15", "remaining_time": "0:13:04"} {"current_steps": 710, "total_steps": 825, "loss": 0.6377, "learning_rate": 5e-06, "epoch": 2.581818181818182, "percentage": 86.06, "elapsed_time": "1:14:15", "remaining_time": "0:12:01"} {"current_steps": 720, "total_steps": 825, "loss": 0.6427, "learning_rate": 5e-06, "epoch": 2.618181818181818, "percentage": 87.27, "elapsed_time": "1:15:14", "remaining_time": "0:10:58"} {"current_steps": 730, "total_steps": 825, "loss": 0.6346, "learning_rate": 5e-06, "epoch": 2.6545454545454543, "percentage": 88.48, "elapsed_time": "1:16:14", "remaining_time": "0:09:55"} {"current_steps": 740, "total_steps": 825, "loss": 0.6414, "learning_rate": 5e-06, "epoch": 2.690909090909091, "percentage": 89.7, "elapsed_time": "1:17:13", "remaining_time": "0:08:52"} {"current_steps": 750, "total_steps": 825, "loss": 0.6363, "learning_rate": 5e-06, "epoch": 2.7272727272727275, "percentage": 90.91, "elapsed_time": "1:18:13", "remaining_time": "0:07:49"} {"current_steps": 760, "total_steps": 825, "loss": 0.6421, "learning_rate": 5e-06, "epoch": 2.7636363636363637, "percentage": 92.12, "elapsed_time": "1:19:12", "remaining_time": "0:06:46"} {"current_steps": 770, "total_steps": 825, "loss": 0.6356, "learning_rate": 5e-06, "epoch": 2.8, "percentage": 93.33, "elapsed_time": "1:20:10", "remaining_time": "0:05:43"} {"current_steps": 780, "total_steps": 825, "loss": 0.6425, "learning_rate": 5e-06, "epoch": 2.8363636363636364, "percentage": 94.55, "elapsed_time": "1:21:09", "remaining_time": "0:04:40"} {"current_steps": 790, "total_steps": 825, "loss": 0.6368, "learning_rate": 5e-06, "epoch": 2.8727272727272726, "percentage": 95.76, "elapsed_time": "1:22:08", "remaining_time": "0:03:38"} {"current_steps": 800, "total_steps": 825, "loss": 0.6405, "learning_rate": 5e-06, "epoch": 2.909090909090909, "percentage": 96.97, "elapsed_time": "1:23:07", "remaining_time": "0:02:35"} {"current_steps": 810, "total_steps": 825, "loss": 0.6357, "learning_rate": 5e-06, "epoch": 2.9454545454545453, "percentage": 98.18, "elapsed_time": "1:24:07", "remaining_time": "0:01:33"} {"current_steps": 820, "total_steps": 825, "loss": 0.6412, "learning_rate": 5e-06, "epoch": 2.981818181818182, "percentage": 99.39, "elapsed_time": "1:25:06", "remaining_time": "0:00:31"} {"current_steps": 825, "total_steps": 825, "eval_loss": 0.7299705147743225, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1:27:36", "remaining_time": "0:00:00"} {"current_steps": 825, "total_steps": 825, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1:29:09", "remaining_time": "0:00:00"}