sedrickkeh's picture
Training in progress, epoch 2
3f0454d verified
{"current_steps": 10, "total_steps": 921, "loss": 0.822, "learning_rate": 5e-06, "epoch": 0.03249390739236393, "percentage": 1.09, "elapsed_time": "0:02:49", "remaining_time": "4:17:31"}
{"current_steps": 20, "total_steps": 921, "loss": 0.7337, "learning_rate": 5e-06, "epoch": 0.06498781478472786, "percentage": 2.17, "elapsed_time": "0:05:32", "remaining_time": "4:09:48"}
{"current_steps": 30, "total_steps": 921, "loss": 0.7074, "learning_rate": 5e-06, "epoch": 0.09748172217709179, "percentage": 3.26, "elapsed_time": "0:08:15", "remaining_time": "4:05:07"}
{"current_steps": 40, "total_steps": 921, "loss": 0.6975, "learning_rate": 5e-06, "epoch": 0.12997562956945571, "percentage": 4.34, "elapsed_time": "0:10:56", "remaining_time": "4:00:57"}
{"current_steps": 50, "total_steps": 921, "loss": 0.6824, "learning_rate": 5e-06, "epoch": 0.16246953696181965, "percentage": 5.43, "elapsed_time": "0:13:37", "remaining_time": "3:57:12"}
{"current_steps": 60, "total_steps": 921, "loss": 0.6687, "learning_rate": 5e-06, "epoch": 0.19496344435418358, "percentage": 6.51, "elapsed_time": "0:16:17", "remaining_time": "3:53:47"}
{"current_steps": 70, "total_steps": 921, "loss": 0.6663, "learning_rate": 5e-06, "epoch": 0.22745735174654752, "percentage": 7.6, "elapsed_time": "0:18:57", "remaining_time": "3:50:34"}
{"current_steps": 80, "total_steps": 921, "loss": 0.651, "learning_rate": 5e-06, "epoch": 0.25995125913891143, "percentage": 8.69, "elapsed_time": "0:21:38", "remaining_time": "3:47:30"}
{"current_steps": 90, "total_steps": 921, "loss": 0.6586, "learning_rate": 5e-06, "epoch": 0.2924451665312754, "percentage": 9.77, "elapsed_time": "0:24:20", "remaining_time": "3:44:43"}
{"current_steps": 100, "total_steps": 921, "loss": 0.6473, "learning_rate": 5e-06, "epoch": 0.3249390739236393, "percentage": 10.86, "elapsed_time": "0:27:02", "remaining_time": "3:41:57"}
{"current_steps": 110, "total_steps": 921, "loss": 0.6511, "learning_rate": 5e-06, "epoch": 0.35743298131600326, "percentage": 11.94, "elapsed_time": "0:29:45", "remaining_time": "3:39:21"}
{"current_steps": 120, "total_steps": 921, "loss": 0.6441, "learning_rate": 5e-06, "epoch": 0.38992688870836717, "percentage": 13.03, "elapsed_time": "0:32:27", "remaining_time": "3:36:37"}
{"current_steps": 130, "total_steps": 921, "loss": 0.6543, "learning_rate": 5e-06, "epoch": 0.42242079610073113, "percentage": 14.12, "elapsed_time": "0:35:09", "remaining_time": "3:33:53"}
{"current_steps": 140, "total_steps": 921, "loss": 0.6445, "learning_rate": 5e-06, "epoch": 0.45491470349309504, "percentage": 15.2, "elapsed_time": "0:37:50", "remaining_time": "3:31:08"}
{"current_steps": 150, "total_steps": 921, "loss": 0.6364, "learning_rate": 5e-06, "epoch": 0.487408610885459, "percentage": 16.29, "elapsed_time": "0:40:34", "remaining_time": "3:28:32"}
{"current_steps": 160, "total_steps": 921, "loss": 0.6325, "learning_rate": 5e-06, "epoch": 0.5199025182778229, "percentage": 17.37, "elapsed_time": "0:43:17", "remaining_time": "3:25:55"}
{"current_steps": 170, "total_steps": 921, "loss": 0.631, "learning_rate": 5e-06, "epoch": 0.5523964256701869, "percentage": 18.46, "elapsed_time": "0:46:00", "remaining_time": "3:23:16"}
{"current_steps": 180, "total_steps": 921, "loss": 0.629, "learning_rate": 5e-06, "epoch": 0.5848903330625508, "percentage": 19.54, "elapsed_time": "0:48:42", "remaining_time": "3:20:32"}
{"current_steps": 190, "total_steps": 921, "loss": 0.6383, "learning_rate": 5e-06, "epoch": 0.6173842404549147, "percentage": 20.63, "elapsed_time": "0:51:24", "remaining_time": "3:17:48"}
{"current_steps": 200, "total_steps": 921, "loss": 0.6277, "learning_rate": 5e-06, "epoch": 0.6498781478472786, "percentage": 21.72, "elapsed_time": "0:54:07", "remaining_time": "3:15:08"}
{"current_steps": 210, "total_steps": 921, "loss": 0.6287, "learning_rate": 5e-06, "epoch": 0.6823720552396426, "percentage": 22.8, "elapsed_time": "0:56:49", "remaining_time": "3:12:25"}
{"current_steps": 220, "total_steps": 921, "loss": 0.6358, "learning_rate": 5e-06, "epoch": 0.7148659626320065, "percentage": 23.89, "elapsed_time": "0:59:32", "remaining_time": "3:09:42"}
{"current_steps": 230, "total_steps": 921, "loss": 0.6331, "learning_rate": 5e-06, "epoch": 0.7473598700243704, "percentage": 24.97, "elapsed_time": "1:02:14", "remaining_time": "3:06:59"}
{"current_steps": 240, "total_steps": 921, "loss": 0.6224, "learning_rate": 5e-06, "epoch": 0.7798537774167343, "percentage": 26.06, "elapsed_time": "1:04:56", "remaining_time": "3:04:15"}
{"current_steps": 250, "total_steps": 921, "loss": 0.6198, "learning_rate": 5e-06, "epoch": 0.8123476848090982, "percentage": 27.14, "elapsed_time": "1:07:37", "remaining_time": "3:01:29"}
{"current_steps": 260, "total_steps": 921, "loss": 0.6157, "learning_rate": 5e-06, "epoch": 0.8448415922014623, "percentage": 28.23, "elapsed_time": "1:10:18", "remaining_time": "2:58:45"}
{"current_steps": 270, "total_steps": 921, "loss": 0.6116, "learning_rate": 5e-06, "epoch": 0.8773354995938262, "percentage": 29.32, "elapsed_time": "1:13:00", "remaining_time": "2:56:02"}
{"current_steps": 280, "total_steps": 921, "loss": 0.6326, "learning_rate": 5e-06, "epoch": 0.9098294069861901, "percentage": 30.4, "elapsed_time": "1:15:42", "remaining_time": "2:53:18"}
{"current_steps": 290, "total_steps": 921, "loss": 0.6331, "learning_rate": 5e-06, "epoch": 0.942323314378554, "percentage": 31.49, "elapsed_time": "1:18:23", "remaining_time": "2:50:33"}
{"current_steps": 300, "total_steps": 921, "loss": 0.6185, "learning_rate": 5e-06, "epoch": 0.974817221770918, "percentage": 32.57, "elapsed_time": "1:21:04", "remaining_time": "2:47:49"}
{"current_steps": 307, "total_steps": 921, "eval_loss": 0.6177791357040405, "epoch": 0.9975629569455727, "percentage": 33.33, "elapsed_time": "1:24:57", "remaining_time": "2:49:54"}
{"current_steps": 310, "total_steps": 921, "loss": 0.6074, "learning_rate": 5e-06, "epoch": 1.007311129163282, "percentage": 33.66, "elapsed_time": "1:26:32", "remaining_time": "2:50:34"}
{"current_steps": 320, "total_steps": 921, "loss": 0.5701, "learning_rate": 5e-06, "epoch": 1.0398050365556457, "percentage": 34.74, "elapsed_time": "1:29:14", "remaining_time": "2:47:35"}
{"current_steps": 330, "total_steps": 921, "loss": 0.5836, "learning_rate": 5e-06, "epoch": 1.0722989439480097, "percentage": 35.83, "elapsed_time": "1:31:55", "remaining_time": "2:44:37"}
{"current_steps": 340, "total_steps": 921, "loss": 0.5676, "learning_rate": 5e-06, "epoch": 1.1047928513403737, "percentage": 36.92, "elapsed_time": "1:34:36", "remaining_time": "2:41:40"}
{"current_steps": 350, "total_steps": 921, "loss": 0.5722, "learning_rate": 5e-06, "epoch": 1.1372867587327375, "percentage": 38.0, "elapsed_time": "1:37:18", "remaining_time": "2:38:44"}
{"current_steps": 360, "total_steps": 921, "loss": 0.5692, "learning_rate": 5e-06, "epoch": 1.1697806661251016, "percentage": 39.09, "elapsed_time": "1:39:59", "remaining_time": "2:35:49"}
{"current_steps": 370, "total_steps": 921, "loss": 0.5716, "learning_rate": 5e-06, "epoch": 1.2022745735174656, "percentage": 40.17, "elapsed_time": "1:42:39", "remaining_time": "2:32:52"}
{"current_steps": 380, "total_steps": 921, "loss": 0.573, "learning_rate": 5e-06, "epoch": 1.2347684809098294, "percentage": 41.26, "elapsed_time": "1:45:20", "remaining_time": "2:29:58"}
{"current_steps": 390, "total_steps": 921, "loss": 0.5759, "learning_rate": 5e-06, "epoch": 1.2672623883021934, "percentage": 42.35, "elapsed_time": "1:48:01", "remaining_time": "2:27:04"}
{"current_steps": 400, "total_steps": 921, "loss": 0.5812, "learning_rate": 5e-06, "epoch": 1.2997562956945572, "percentage": 43.43, "elapsed_time": "1:50:41", "remaining_time": "2:24:10"}
{"current_steps": 410, "total_steps": 921, "loss": 0.5781, "learning_rate": 5e-06, "epoch": 1.3322502030869212, "percentage": 44.52, "elapsed_time": "1:53:23", "remaining_time": "2:21:19"}
{"current_steps": 420, "total_steps": 921, "loss": 0.5829, "learning_rate": 5e-06, "epoch": 1.3647441104792852, "percentage": 45.6, "elapsed_time": "1:56:04", "remaining_time": "2:18:27"}
{"current_steps": 430, "total_steps": 921, "loss": 0.5743, "learning_rate": 5e-06, "epoch": 1.397238017871649, "percentage": 46.69, "elapsed_time": "1:58:46", "remaining_time": "2:15:37"}
{"current_steps": 440, "total_steps": 921, "loss": 0.568, "learning_rate": 5e-06, "epoch": 1.429731925264013, "percentage": 47.77, "elapsed_time": "2:01:26", "remaining_time": "2:12:45"}
{"current_steps": 450, "total_steps": 921, "loss": 0.5688, "learning_rate": 5e-06, "epoch": 1.4622258326563768, "percentage": 48.86, "elapsed_time": "2:04:07", "remaining_time": "2:09:54"}
{"current_steps": 460, "total_steps": 921, "loss": 0.5765, "learning_rate": 5e-06, "epoch": 1.4947197400487409, "percentage": 49.95, "elapsed_time": "2:06:48", "remaining_time": "2:07:04"}
{"current_steps": 470, "total_steps": 921, "loss": 0.5709, "learning_rate": 5e-06, "epoch": 1.5272136474411049, "percentage": 51.03, "elapsed_time": "2:09:29", "remaining_time": "2:04:15"}
{"current_steps": 480, "total_steps": 921, "loss": 0.5744, "learning_rate": 5e-06, "epoch": 1.5597075548334687, "percentage": 52.12, "elapsed_time": "2:12:10", "remaining_time": "2:01:26"}
{"current_steps": 490, "total_steps": 921, "loss": 0.5736, "learning_rate": 5e-06, "epoch": 1.5922014622258327, "percentage": 53.2, "elapsed_time": "2:14:51", "remaining_time": "1:58:37"}
{"current_steps": 500, "total_steps": 921, "loss": 0.5644, "learning_rate": 5e-06, "epoch": 1.6246953696181965, "percentage": 54.29, "elapsed_time": "2:17:31", "remaining_time": "1:55:48"}
{"current_steps": 510, "total_steps": 921, "loss": 0.5631, "learning_rate": 5e-06, "epoch": 1.6571892770105605, "percentage": 55.37, "elapsed_time": "2:20:12", "remaining_time": "1:52:59"}
{"current_steps": 520, "total_steps": 921, "loss": 0.5736, "learning_rate": 5e-06, "epoch": 1.6896831844029245, "percentage": 56.46, "elapsed_time": "2:22:52", "remaining_time": "1:50:10"}
{"current_steps": 530, "total_steps": 921, "loss": 0.565, "learning_rate": 5e-06, "epoch": 1.7221770917952883, "percentage": 57.55, "elapsed_time": "2:25:32", "remaining_time": "1:47:22"}
{"current_steps": 540, "total_steps": 921, "loss": 0.5735, "learning_rate": 5e-06, "epoch": 1.7546709991876523, "percentage": 58.63, "elapsed_time": "2:28:13", "remaining_time": "1:44:34"}
{"current_steps": 550, "total_steps": 921, "loss": 0.5673, "learning_rate": 5e-06, "epoch": 1.7871649065800161, "percentage": 59.72, "elapsed_time": "2:30:53", "remaining_time": "1:41:46"}
{"current_steps": 560, "total_steps": 921, "loss": 0.5678, "learning_rate": 5e-06, "epoch": 1.8196588139723802, "percentage": 60.8, "elapsed_time": "2:33:34", "remaining_time": "1:39:00"}
{"current_steps": 570, "total_steps": 921, "loss": 0.5685, "learning_rate": 5e-06, "epoch": 1.8521527213647442, "percentage": 61.89, "elapsed_time": "2:36:14", "remaining_time": "1:36:12"}
{"current_steps": 580, "total_steps": 921, "loss": 0.5717, "learning_rate": 5e-06, "epoch": 1.8846466287571082, "percentage": 62.98, "elapsed_time": "2:38:55", "remaining_time": "1:33:26"}
{"current_steps": 590, "total_steps": 921, "loss": 0.5744, "learning_rate": 5e-06, "epoch": 1.917140536149472, "percentage": 64.06, "elapsed_time": "2:41:37", "remaining_time": "1:30:40"}
{"current_steps": 600, "total_steps": 921, "loss": 0.5646, "learning_rate": 5e-06, "epoch": 1.9496344435418358, "percentage": 65.15, "elapsed_time": "2:44:18", "remaining_time": "1:27:54"}
{"current_steps": 610, "total_steps": 921, "loss": 0.5652, "learning_rate": 5e-06, "epoch": 1.9821283509341998, "percentage": 66.23, "elapsed_time": "2:47:00", "remaining_time": "1:25:08"}
{"current_steps": 615, "total_steps": 921, "eval_loss": 0.6079972982406616, "epoch": 1.9983753046303818, "percentage": 66.78, "elapsed_time": "2:50:13", "remaining_time": "1:24:41"}
{"current_steps": 620, "total_steps": 921, "loss": 0.5462, "learning_rate": 5e-06, "epoch": 2.014622258326564, "percentage": 67.32, "elapsed_time": "2:52:32", "remaining_time": "1:23:45"}
{"current_steps": 630, "total_steps": 921, "loss": 0.5103, "learning_rate": 5e-06, "epoch": 2.047116165718928, "percentage": 68.4, "elapsed_time": "2:55:12", "remaining_time": "1:20:56"}
{"current_steps": 640, "total_steps": 921, "loss": 0.5161, "learning_rate": 5e-06, "epoch": 2.0796100731112914, "percentage": 69.49, "elapsed_time": "2:57:54", "remaining_time": "1:18:06"}
{"current_steps": 650, "total_steps": 921, "loss": 0.5166, "learning_rate": 5e-06, "epoch": 2.1121039805036554, "percentage": 70.58, "elapsed_time": "3:00:35", "remaining_time": "1:15:17"}
{"current_steps": 660, "total_steps": 921, "loss": 0.5057, "learning_rate": 5e-06, "epoch": 2.1445978878960195, "percentage": 71.66, "elapsed_time": "3:03:16", "remaining_time": "1:12:28"}
{"current_steps": 670, "total_steps": 921, "loss": 0.5193, "learning_rate": 5e-06, "epoch": 2.1770917952883835, "percentage": 72.75, "elapsed_time": "3:05:57", "remaining_time": "1:09:39"}
{"current_steps": 680, "total_steps": 921, "loss": 0.5261, "learning_rate": 5e-06, "epoch": 2.2095857026807475, "percentage": 73.83, "elapsed_time": "3:08:39", "remaining_time": "1:06:51"}
{"current_steps": 690, "total_steps": 921, "loss": 0.5216, "learning_rate": 5e-06, "epoch": 2.2420796100731115, "percentage": 74.92, "elapsed_time": "3:11:20", "remaining_time": "1:04:03"}
{"current_steps": 700, "total_steps": 921, "loss": 0.5239, "learning_rate": 5e-06, "epoch": 2.274573517465475, "percentage": 76.0, "elapsed_time": "3:14:01", "remaining_time": "1:01:15"}
{"current_steps": 710, "total_steps": 921, "loss": 0.518, "learning_rate": 5e-06, "epoch": 2.307067424857839, "percentage": 77.09, "elapsed_time": "3:16:43", "remaining_time": "0:58:27"}
{"current_steps": 720, "total_steps": 921, "loss": 0.5311, "learning_rate": 5e-06, "epoch": 2.339561332250203, "percentage": 78.18, "elapsed_time": "3:19:24", "remaining_time": "0:55:40"}
{"current_steps": 730, "total_steps": 921, "loss": 0.5225, "learning_rate": 5e-06, "epoch": 2.372055239642567, "percentage": 79.26, "elapsed_time": "3:22:05", "remaining_time": "0:52:52"}
{"current_steps": 740, "total_steps": 921, "loss": 0.5228, "learning_rate": 5e-06, "epoch": 2.404549147034931, "percentage": 80.35, "elapsed_time": "3:24:46", "remaining_time": "0:50:05"}
{"current_steps": 750, "total_steps": 921, "loss": 0.5269, "learning_rate": 5e-06, "epoch": 2.4370430544272947, "percentage": 81.43, "elapsed_time": "3:27:29", "remaining_time": "0:47:18"}
{"current_steps": 760, "total_steps": 921, "loss": 0.5175, "learning_rate": 5e-06, "epoch": 2.4695369618196588, "percentage": 82.52, "elapsed_time": "3:30:11", "remaining_time": "0:44:31"}
{"current_steps": 770, "total_steps": 921, "loss": 0.5219, "learning_rate": 5e-06, "epoch": 2.502030869212023, "percentage": 83.6, "elapsed_time": "3:32:53", "remaining_time": "0:41:44"}
{"current_steps": 780, "total_steps": 921, "loss": 0.5196, "learning_rate": 5e-06, "epoch": 2.534524776604387, "percentage": 84.69, "elapsed_time": "3:35:35", "remaining_time": "0:38:58"}
{"current_steps": 790, "total_steps": 921, "loss": 0.5167, "learning_rate": 5e-06, "epoch": 2.567018683996751, "percentage": 85.78, "elapsed_time": "3:38:15", "remaining_time": "0:36:11"}
{"current_steps": 800, "total_steps": 921, "loss": 0.5186, "learning_rate": 5e-06, "epoch": 2.5995125913891144, "percentage": 86.86, "elapsed_time": "3:40:56", "remaining_time": "0:33:24"}
{"current_steps": 810, "total_steps": 921, "loss": 0.5269, "learning_rate": 5e-06, "epoch": 2.6320064987814784, "percentage": 87.95, "elapsed_time": "3:43:36", "remaining_time": "0:30:38"}
{"current_steps": 820, "total_steps": 921, "loss": 0.5241, "learning_rate": 5e-06, "epoch": 2.6645004061738424, "percentage": 89.03, "elapsed_time": "3:46:18", "remaining_time": "0:27:52"}
{"current_steps": 830, "total_steps": 921, "loss": 0.52, "learning_rate": 5e-06, "epoch": 2.6969943135662064, "percentage": 90.12, "elapsed_time": "3:49:00", "remaining_time": "0:25:06"}
{"current_steps": 840, "total_steps": 921, "loss": 0.5218, "learning_rate": 5e-06, "epoch": 2.7294882209585705, "percentage": 91.21, "elapsed_time": "3:51:41", "remaining_time": "0:22:20"}
{"current_steps": 850, "total_steps": 921, "loss": 0.5295, "learning_rate": 5e-06, "epoch": 2.761982128350934, "percentage": 92.29, "elapsed_time": "3:54:23", "remaining_time": "0:19:34"}
{"current_steps": 860, "total_steps": 921, "loss": 0.5237, "learning_rate": 5e-06, "epoch": 2.794476035743298, "percentage": 93.38, "elapsed_time": "3:57:05", "remaining_time": "0:16:48"}
{"current_steps": 870, "total_steps": 921, "loss": 0.522, "learning_rate": 5e-06, "epoch": 2.826969943135662, "percentage": 94.46, "elapsed_time": "3:59:46", "remaining_time": "0:14:03"}
{"current_steps": 880, "total_steps": 921, "loss": 0.5188, "learning_rate": 5e-06, "epoch": 2.859463850528026, "percentage": 95.55, "elapsed_time": "4:02:28", "remaining_time": "0:11:17"}
{"current_steps": 890, "total_steps": 921, "loss": 0.5252, "learning_rate": 5e-06, "epoch": 2.89195775792039, "percentage": 96.63, "elapsed_time": "4:05:08", "remaining_time": "0:08:32"}
{"current_steps": 900, "total_steps": 921, "loss": 0.5181, "learning_rate": 5e-06, "epoch": 2.9244516653127537, "percentage": 97.72, "elapsed_time": "4:07:49", "remaining_time": "0:05:46"}
{"current_steps": 910, "total_steps": 921, "loss": 0.5282, "learning_rate": 5e-06, "epoch": 2.9569455727051177, "percentage": 98.81, "elapsed_time": "4:10:29", "remaining_time": "0:03:01"}
{"current_steps": 920, "total_steps": 921, "loss": 0.5197, "learning_rate": 5e-06, "epoch": 2.9894394800974817, "percentage": 99.89, "elapsed_time": "4:13:09", "remaining_time": "0:00:16"}
{"current_steps": 921, "total_steps": 921, "eval_loss": 0.6120628714561462, "epoch": 2.992688870836718, "percentage": 100.0, "elapsed_time": "4:16:16", "remaining_time": "0:00:00"}
{"current_steps": 921, "total_steps": 921, "epoch": 2.992688870836718, "percentage": 100.0, "elapsed_time": "4:17:12", "remaining_time": "0:00:00"}