gsmyrnis's picture
Training in progress, epoch 2
5c738af verified
{"current_steps": 10, "total_steps": 867, "loss": 0.9289, "learning_rate": 5e-06, "epoch": 0.03460207612456748, "percentage": 1.15, "elapsed_time": "0:01:03", "remaining_time": "1:30:00"}
{"current_steps": 20, "total_steps": 867, "loss": 0.8126, "learning_rate": 5e-06, "epoch": 0.06920415224913495, "percentage": 2.31, "elapsed_time": "0:02:05", "remaining_time": "1:28:43"}
{"current_steps": 30, "total_steps": 867, "loss": 0.7742, "learning_rate": 5e-06, "epoch": 0.10380622837370242, "percentage": 3.46, "elapsed_time": "0:03:07", "remaining_time": "1:27:21"}
{"current_steps": 40, "total_steps": 867, "loss": 0.747, "learning_rate": 5e-06, "epoch": 0.1384083044982699, "percentage": 4.61, "elapsed_time": "0:04:10", "remaining_time": "1:26:21"}
{"current_steps": 50, "total_steps": 867, "loss": 0.7119, "learning_rate": 5e-06, "epoch": 0.17301038062283736, "percentage": 5.77, "elapsed_time": "0:05:12", "remaining_time": "1:25:10"}
{"current_steps": 60, "total_steps": 867, "loss": 0.688, "learning_rate": 5e-06, "epoch": 0.20761245674740483, "percentage": 6.92, "elapsed_time": "0:06:15", "remaining_time": "1:24:08"}
{"current_steps": 70, "total_steps": 867, "loss": 0.6709, "learning_rate": 5e-06, "epoch": 0.2422145328719723, "percentage": 8.07, "elapsed_time": "0:07:17", "remaining_time": "1:23:02"}
{"current_steps": 80, "total_steps": 867, "loss": 0.6633, "learning_rate": 5e-06, "epoch": 0.2768166089965398, "percentage": 9.23, "elapsed_time": "0:08:20", "remaining_time": "1:22:05"}
{"current_steps": 90, "total_steps": 867, "loss": 0.659, "learning_rate": 5e-06, "epoch": 0.31141868512110726, "percentage": 10.38, "elapsed_time": "0:09:22", "remaining_time": "1:20:58"}
{"current_steps": 100, "total_steps": 867, "loss": 0.6368, "learning_rate": 5e-06, "epoch": 0.3460207612456747, "percentage": 11.53, "elapsed_time": "0:10:25", "remaining_time": "1:19:54"}
{"current_steps": 110, "total_steps": 867, "loss": 0.642, "learning_rate": 5e-06, "epoch": 0.3806228373702422, "percentage": 12.69, "elapsed_time": "0:11:27", "remaining_time": "1:18:51"}
{"current_steps": 120, "total_steps": 867, "loss": 0.6332, "learning_rate": 5e-06, "epoch": 0.41522491349480967, "percentage": 13.84, "elapsed_time": "0:12:31", "remaining_time": "1:17:59"}
{"current_steps": 130, "total_steps": 867, "loss": 0.6317, "learning_rate": 5e-06, "epoch": 0.44982698961937717, "percentage": 14.99, "elapsed_time": "0:13:35", "remaining_time": "1:17:02"}
{"current_steps": 140, "total_steps": 867, "loss": 0.6308, "learning_rate": 5e-06, "epoch": 0.4844290657439446, "percentage": 16.15, "elapsed_time": "0:14:37", "remaining_time": "1:15:56"}
{"current_steps": 150, "total_steps": 867, "loss": 0.6297, "learning_rate": 5e-06, "epoch": 0.5190311418685121, "percentage": 17.3, "elapsed_time": "0:15:39", "remaining_time": "1:14:52"}
{"current_steps": 160, "total_steps": 867, "loss": 0.6251, "learning_rate": 5e-06, "epoch": 0.5536332179930796, "percentage": 18.45, "elapsed_time": "0:16:42", "remaining_time": "1:13:48"}
{"current_steps": 170, "total_steps": 867, "loss": 0.609, "learning_rate": 5e-06, "epoch": 0.5882352941176471, "percentage": 19.61, "elapsed_time": "0:17:44", "remaining_time": "1:12:44"}
{"current_steps": 180, "total_steps": 867, "loss": 0.6186, "learning_rate": 5e-06, "epoch": 0.6228373702422145, "percentage": 20.76, "elapsed_time": "0:18:48", "remaining_time": "1:11:46"}
{"current_steps": 190, "total_steps": 867, "loss": 0.6201, "learning_rate": 5e-06, "epoch": 0.657439446366782, "percentage": 21.91, "elapsed_time": "0:19:53", "remaining_time": "1:10:52"}
{"current_steps": 200, "total_steps": 867, "loss": 0.6176, "learning_rate": 5e-06, "epoch": 0.6920415224913494, "percentage": 23.07, "elapsed_time": "0:20:55", "remaining_time": "1:09:47"}
{"current_steps": 210, "total_steps": 867, "loss": 0.612, "learning_rate": 5e-06, "epoch": 0.726643598615917, "percentage": 24.22, "elapsed_time": "0:21:57", "remaining_time": "1:08:42"}
{"current_steps": 220, "total_steps": 867, "loss": 0.6069, "learning_rate": 5e-06, "epoch": 0.7612456747404844, "percentage": 25.37, "elapsed_time": "0:22:59", "remaining_time": "1:07:38"}
{"current_steps": 230, "total_steps": 867, "loss": 0.6055, "learning_rate": 5e-06, "epoch": 0.7958477508650519, "percentage": 26.53, "elapsed_time": "0:24:03", "remaining_time": "1:06:37"}
{"current_steps": 240, "total_steps": 867, "loss": 0.6068, "learning_rate": 5e-06, "epoch": 0.8304498269896193, "percentage": 27.68, "elapsed_time": "0:25:05", "remaining_time": "1:05:32"}
{"current_steps": 250, "total_steps": 867, "loss": 0.6026, "learning_rate": 5e-06, "epoch": 0.8650519031141869, "percentage": 28.84, "elapsed_time": "0:26:07", "remaining_time": "1:04:28"}
{"current_steps": 260, "total_steps": 867, "loss": 0.6077, "learning_rate": 5e-06, "epoch": 0.8996539792387543, "percentage": 29.99, "elapsed_time": "0:27:09", "remaining_time": "1:03:24"}
{"current_steps": 270, "total_steps": 867, "loss": 0.6031, "learning_rate": 5e-06, "epoch": 0.9342560553633218, "percentage": 31.14, "elapsed_time": "0:28:12", "remaining_time": "1:02:22"}
{"current_steps": 280, "total_steps": 867, "loss": 0.6051, "learning_rate": 5e-06, "epoch": 0.9688581314878892, "percentage": 32.3, "elapsed_time": "0:29:14", "remaining_time": "1:01:18"}
{"current_steps": 289, "total_steps": 867, "eval_loss": 0.6054237484931946, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "0:30:37", "remaining_time": "1:01:14"}
{"current_steps": 290, "total_steps": 867, "loss": 0.5952, "learning_rate": 5e-06, "epoch": 1.0034602076124568, "percentage": 33.45, "elapsed_time": "0:34:40", "remaining_time": "1:08:59"}
{"current_steps": 300, "total_steps": 867, "loss": 0.558, "learning_rate": 5e-06, "epoch": 1.0380622837370241, "percentage": 34.6, "elapsed_time": "0:35:42", "remaining_time": "1:07:30"}
{"current_steps": 310, "total_steps": 867, "loss": 0.5671, "learning_rate": 5e-06, "epoch": 1.0726643598615917, "percentage": 35.76, "elapsed_time": "0:36:45", "remaining_time": "1:06:02"}
{"current_steps": 320, "total_steps": 867, "loss": 0.5575, "learning_rate": 5e-06, "epoch": 1.1072664359861593, "percentage": 36.91, "elapsed_time": "0:37:47", "remaining_time": "1:04:35"}
{"current_steps": 330, "total_steps": 867, "loss": 0.5663, "learning_rate": 5e-06, "epoch": 1.1418685121107266, "percentage": 38.06, "elapsed_time": "0:38:49", "remaining_time": "1:03:11"}
{"current_steps": 340, "total_steps": 867, "loss": 0.5553, "learning_rate": 5e-06, "epoch": 1.1764705882352942, "percentage": 39.22, "elapsed_time": "0:39:52", "remaining_time": "1:01:48"}
{"current_steps": 350, "total_steps": 867, "loss": 0.5524, "learning_rate": 5e-06, "epoch": 1.2110726643598615, "percentage": 40.37, "elapsed_time": "0:40:54", "remaining_time": "1:00:25"}
{"current_steps": 360, "total_steps": 867, "loss": 0.5648, "learning_rate": 5e-06, "epoch": 1.245674740484429, "percentage": 41.52, "elapsed_time": "0:41:57", "remaining_time": "0:59:05"}
{"current_steps": 370, "total_steps": 867, "loss": 0.5566, "learning_rate": 5e-06, "epoch": 1.2802768166089966, "percentage": 42.68, "elapsed_time": "0:42:59", "remaining_time": "0:57:45"}
{"current_steps": 380, "total_steps": 867, "loss": 0.5596, "learning_rate": 5e-06, "epoch": 1.314878892733564, "percentage": 43.83, "elapsed_time": "0:44:02", "remaining_time": "0:56:26"}
{"current_steps": 390, "total_steps": 867, "loss": 0.5566, "learning_rate": 5e-06, "epoch": 1.3494809688581315, "percentage": 44.98, "elapsed_time": "0:45:04", "remaining_time": "0:55:08"}
{"current_steps": 400, "total_steps": 867, "loss": 0.5582, "learning_rate": 5e-06, "epoch": 1.3840830449826989, "percentage": 46.14, "elapsed_time": "0:46:07", "remaining_time": "0:53:50"}
{"current_steps": 410, "total_steps": 867, "loss": 0.5611, "learning_rate": 5e-06, "epoch": 1.4186851211072664, "percentage": 47.29, "elapsed_time": "0:47:10", "remaining_time": "0:52:34"}
{"current_steps": 420, "total_steps": 867, "loss": 0.5552, "learning_rate": 5e-06, "epoch": 1.453287197231834, "percentage": 48.44, "elapsed_time": "0:48:12", "remaining_time": "0:51:18"}
{"current_steps": 430, "total_steps": 867, "loss": 0.5688, "learning_rate": 5e-06, "epoch": 1.4878892733564013, "percentage": 49.6, "elapsed_time": "0:49:15", "remaining_time": "0:50:03"}
{"current_steps": 440, "total_steps": 867, "loss": 0.5525, "learning_rate": 5e-06, "epoch": 1.5224913494809689, "percentage": 50.75, "elapsed_time": "0:50:17", "remaining_time": "0:48:48"}
{"current_steps": 450, "total_steps": 867, "loss": 0.5617, "learning_rate": 5e-06, "epoch": 1.5570934256055362, "percentage": 51.9, "elapsed_time": "0:51:19", "remaining_time": "0:47:34"}
{"current_steps": 460, "total_steps": 867, "loss": 0.5678, "learning_rate": 5e-06, "epoch": 1.5916955017301038, "percentage": 53.06, "elapsed_time": "0:52:22", "remaining_time": "0:46:20"}
{"current_steps": 470, "total_steps": 867, "loss": 0.5608, "learning_rate": 5e-06, "epoch": 1.6262975778546713, "percentage": 54.21, "elapsed_time": "0:53:24", "remaining_time": "0:45:07"}
{"current_steps": 480, "total_steps": 867, "loss": 0.5622, "learning_rate": 5e-06, "epoch": 1.6608996539792389, "percentage": 55.36, "elapsed_time": "0:54:27", "remaining_time": "0:43:54"}
{"current_steps": 490, "total_steps": 867, "loss": 0.5498, "learning_rate": 5e-06, "epoch": 1.6955017301038062, "percentage": 56.52, "elapsed_time": "0:55:29", "remaining_time": "0:42:41"}
{"current_steps": 500, "total_steps": 867, "loss": 0.5514, "learning_rate": 5e-06, "epoch": 1.7301038062283736, "percentage": 57.67, "elapsed_time": "0:56:32", "remaining_time": "0:41:29"}
{"current_steps": 510, "total_steps": 867, "loss": 0.5632, "learning_rate": 5e-06, "epoch": 1.7647058823529411, "percentage": 58.82, "elapsed_time": "0:57:34", "remaining_time": "0:40:18"}
{"current_steps": 520, "total_steps": 867, "loss": 0.559, "learning_rate": 5e-06, "epoch": 1.7993079584775087, "percentage": 59.98, "elapsed_time": "0:58:37", "remaining_time": "0:39:06"}
{"current_steps": 530, "total_steps": 867, "loss": 0.5522, "learning_rate": 5e-06, "epoch": 1.8339100346020762, "percentage": 61.13, "elapsed_time": "0:59:39", "remaining_time": "0:37:56"}
{"current_steps": 540, "total_steps": 867, "loss": 0.5537, "learning_rate": 5e-06, "epoch": 1.8685121107266436, "percentage": 62.28, "elapsed_time": "1:00:42", "remaining_time": "0:36:45"}
{"current_steps": 550, "total_steps": 867, "loss": 0.5557, "learning_rate": 5e-06, "epoch": 1.903114186851211, "percentage": 63.44, "elapsed_time": "1:01:44", "remaining_time": "0:35:35"}
{"current_steps": 560, "total_steps": 867, "loss": 0.5481, "learning_rate": 5e-06, "epoch": 1.9377162629757785, "percentage": 64.59, "elapsed_time": "1:02:46", "remaining_time": "0:34:25"}
{"current_steps": 570, "total_steps": 867, "loss": 0.5546, "learning_rate": 5e-06, "epoch": 1.972318339100346, "percentage": 65.74, "elapsed_time": "1:03:49", "remaining_time": "0:33:15"}
{"current_steps": 578, "total_steps": 867, "eval_loss": 0.5923461318016052, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "1:05:04", "remaining_time": "0:32:32"}
{"current_steps": 580, "total_steps": 867, "loss": 0.5407, "learning_rate": 5e-06, "epoch": 2.0069204152249136, "percentage": 66.9, "elapsed_time": "1:09:13", "remaining_time": "0:34:15"}
{"current_steps": 590, "total_steps": 867, "loss": 0.51, "learning_rate": 5e-06, "epoch": 2.041522491349481, "percentage": 68.05, "elapsed_time": "1:10:16", "remaining_time": "0:32:59"}
{"current_steps": 600, "total_steps": 867, "loss": 0.5043, "learning_rate": 5e-06, "epoch": 2.0761245674740483, "percentage": 69.2, "elapsed_time": "1:11:18", "remaining_time": "0:31:43"}
{"current_steps": 610, "total_steps": 867, "loss": 0.508, "learning_rate": 5e-06, "epoch": 2.110726643598616, "percentage": 70.36, "elapsed_time": "1:12:20", "remaining_time": "0:30:28"}
{"current_steps": 620, "total_steps": 867, "loss": 0.5109, "learning_rate": 5e-06, "epoch": 2.1453287197231834, "percentage": 71.51, "elapsed_time": "1:13:23", "remaining_time": "0:29:14"}
{"current_steps": 630, "total_steps": 867, "loss": 0.5151, "learning_rate": 5e-06, "epoch": 2.179930795847751, "percentage": 72.66, "elapsed_time": "1:14:25", "remaining_time": "0:27:59"}
{"current_steps": 640, "total_steps": 867, "loss": 0.5119, "learning_rate": 5e-06, "epoch": 2.2145328719723185, "percentage": 73.82, "elapsed_time": "1:15:28", "remaining_time": "0:26:46"}
{"current_steps": 650, "total_steps": 867, "loss": 0.5113, "learning_rate": 5e-06, "epoch": 2.2491349480968856, "percentage": 74.97, "elapsed_time": "1:16:30", "remaining_time": "0:25:32"}
{"current_steps": 660, "total_steps": 867, "loss": 0.5131, "learning_rate": 5e-06, "epoch": 2.283737024221453, "percentage": 76.12, "elapsed_time": "1:17:33", "remaining_time": "0:24:19"}
{"current_steps": 670, "total_steps": 867, "loss": 0.5115, "learning_rate": 5e-06, "epoch": 2.3183391003460208, "percentage": 77.28, "elapsed_time": "1:18:35", "remaining_time": "0:23:06"}
{"current_steps": 680, "total_steps": 867, "loss": 0.5188, "learning_rate": 5e-06, "epoch": 2.3529411764705883, "percentage": 78.43, "elapsed_time": "1:19:38", "remaining_time": "0:21:54"}
{"current_steps": 690, "total_steps": 867, "loss": 0.5135, "learning_rate": 5e-06, "epoch": 2.387543252595156, "percentage": 79.58, "elapsed_time": "1:20:40", "remaining_time": "0:20:41"}
{"current_steps": 700, "total_steps": 867, "loss": 0.5182, "learning_rate": 5e-06, "epoch": 2.422145328719723, "percentage": 80.74, "elapsed_time": "1:21:43", "remaining_time": "0:19:29"}
{"current_steps": 710, "total_steps": 867, "loss": 0.5085, "learning_rate": 5e-06, "epoch": 2.4567474048442905, "percentage": 81.89, "elapsed_time": "1:22:45", "remaining_time": "0:18:18"}
{"current_steps": 720, "total_steps": 867, "loss": 0.514, "learning_rate": 5e-06, "epoch": 2.491349480968858, "percentage": 83.04, "elapsed_time": "1:23:47", "remaining_time": "0:17:06"}
{"current_steps": 730, "total_steps": 867, "loss": 0.5094, "learning_rate": 5e-06, "epoch": 2.5259515570934257, "percentage": 84.2, "elapsed_time": "1:24:50", "remaining_time": "0:15:55"}
{"current_steps": 740, "total_steps": 867, "loss": 0.5138, "learning_rate": 5e-06, "epoch": 2.5605536332179932, "percentage": 85.35, "elapsed_time": "1:25:53", "remaining_time": "0:14:44"}
{"current_steps": 750, "total_steps": 867, "loss": 0.5192, "learning_rate": 5e-06, "epoch": 2.595155709342561, "percentage": 86.51, "elapsed_time": "1:26:56", "remaining_time": "0:13:33"}
{"current_steps": 760, "total_steps": 867, "loss": 0.5122, "learning_rate": 5e-06, "epoch": 2.629757785467128, "percentage": 87.66, "elapsed_time": "1:27:58", "remaining_time": "0:12:23"}
{"current_steps": 770, "total_steps": 867, "loss": 0.5136, "learning_rate": 5e-06, "epoch": 2.6643598615916955, "percentage": 88.81, "elapsed_time": "1:29:01", "remaining_time": "0:11:12"}
{"current_steps": 780, "total_steps": 867, "loss": 0.5147, "learning_rate": 5e-06, "epoch": 2.698961937716263, "percentage": 89.97, "elapsed_time": "1:30:03", "remaining_time": "0:10:02"}
{"current_steps": 790, "total_steps": 867, "loss": 0.5147, "learning_rate": 5e-06, "epoch": 2.7335640138408306, "percentage": 91.12, "elapsed_time": "1:31:05", "remaining_time": "0:08:52"}
{"current_steps": 800, "total_steps": 867, "loss": 0.5104, "learning_rate": 5e-06, "epoch": 2.7681660899653977, "percentage": 92.27, "elapsed_time": "1:32:08", "remaining_time": "0:07:42"}
{"current_steps": 810, "total_steps": 867, "loss": 0.5128, "learning_rate": 5e-06, "epoch": 2.8027681660899653, "percentage": 93.43, "elapsed_time": "1:33:10", "remaining_time": "0:06:33"}
{"current_steps": 820, "total_steps": 867, "loss": 0.5132, "learning_rate": 5e-06, "epoch": 2.837370242214533, "percentage": 94.58, "elapsed_time": "1:34:13", "remaining_time": "0:05:24"}
{"current_steps": 830, "total_steps": 867, "loss": 0.5074, "learning_rate": 5e-06, "epoch": 2.8719723183391004, "percentage": 95.73, "elapsed_time": "1:35:15", "remaining_time": "0:04:14"}
{"current_steps": 840, "total_steps": 867, "loss": 0.5215, "learning_rate": 5e-06, "epoch": 2.906574394463668, "percentage": 96.89, "elapsed_time": "1:36:18", "remaining_time": "0:03:05"}
{"current_steps": 850, "total_steps": 867, "loss": 0.5102, "learning_rate": 5e-06, "epoch": 2.9411764705882355, "percentage": 98.04, "elapsed_time": "1:37:21", "remaining_time": "0:01:56"}
{"current_steps": 860, "total_steps": 867, "loss": 0.5168, "learning_rate": 5e-06, "epoch": 2.9757785467128026, "percentage": 99.19, "elapsed_time": "1:38:24", "remaining_time": "0:00:48"}
{"current_steps": 867, "total_steps": 867, "eval_loss": 0.5936245918273926, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1:42:52", "remaining_time": "0:00:00"}
{"current_steps": 867, "total_steps": 867, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1:46:11", "remaining_time": "0:00:00"}