SKNahin commited on
Commit
caabed1
1 Parent(s): 1d077f7

Training in progress, step 4671

Browse files
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:36d593400d3e815816221b20e5851a5396ba2fc628de3eed28f55b67e80016e1
3
  size 4965799096
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd5b54c84b76640ffebf0954f00fd2ec61bc957e8665038db051e17448df290b
3
  size 4965799096
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6f3d4e06d5817b08c3f661ae2a3d4a16728c75eb0b0c06ad89e1d1d5b0760bf6
3
  size 1459729952
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae45ae9af4a5e93ccb164f22cc8d2ad1e9cedd8a0b3680d357d3c56d00fb5a37
3
  size 1459729952
trainer_log.jsonl CHANGED
@@ -4507,3 +4507,166 @@
4507
  {"current_steps": 4507, "total_steps": 4671, "loss": 0.6902, "learning_rate": 1.2402305505128553e-07, "epoch": 0.9648122876026866, "percentage": 96.49, "elapsed_time": "23:00:27", "remaining_time": "0:50:13"}
4508
  {"current_steps": 4508, "total_steps": 4671, "loss": 0.6883, "learning_rate": 1.2251673136858931e-07, "epoch": 0.9650263573359021, "percentage": 96.51, "elapsed_time": "23:00:46", "remaining_time": "0:49:55"}
4509
  {"current_steps": 4509, "total_steps": 4671, "loss": 0.6963, "learning_rate": 1.2101958309578275e-07, "epoch": 0.9652404270691177, "percentage": 96.53, "elapsed_time": "23:01:04", "remaining_time": "0:49:37"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4507
  {"current_steps": 4507, "total_steps": 4671, "loss": 0.6902, "learning_rate": 1.2402305505128553e-07, "epoch": 0.9648122876026866, "percentage": 96.49, "elapsed_time": "23:00:27", "remaining_time": "0:50:13"}
4508
  {"current_steps": 4508, "total_steps": 4671, "loss": 0.6883, "learning_rate": 1.2251673136858931e-07, "epoch": 0.9650263573359021, "percentage": 96.51, "elapsed_time": "23:00:46", "remaining_time": "0:49:55"}
4509
  {"current_steps": 4509, "total_steps": 4671, "loss": 0.6963, "learning_rate": 1.2101958309578275e-07, "epoch": 0.9652404270691177, "percentage": 96.53, "elapsed_time": "23:01:04", "remaining_time": "0:49:37"}
4510
+ {"current_steps": 4510, "total_steps": 4671, "loss": 0.6621, "learning_rate": 1.1953161092394637e-07, "epoch": 0.9654544968023333, "percentage": 96.55, "elapsed_time": "23:01:22", "remaining_time": "0:49:18"}
4511
+ {"current_steps": 4511, "total_steps": 4671, "loss": 0.7218, "learning_rate": 1.1805281553992631e-07, "epoch": 0.965668566535549, "percentage": 96.57, "elapsed_time": "23:01:41", "remaining_time": "0:49:00"}
4512
+ {"current_steps": 4512, "total_steps": 4671, "loss": 0.6955, "learning_rate": 1.1658319762633207e-07, "epoch": 0.9658826362687646, "percentage": 96.6, "elapsed_time": "23:01:59", "remaining_time": "0:48:42"}
4513
+ {"current_steps": 4513, "total_steps": 4671, "loss": 0.6829, "learning_rate": 1.1512275786153437e-07, "epoch": 0.9660967060019802, "percentage": 96.62, "elapsed_time": "23:02:17", "remaining_time": "0:48:23"}
4514
+ {"current_steps": 4514, "total_steps": 4671, "loss": 0.6828, "learning_rate": 1.136714969196695e-07, "epoch": 0.9663107757351957, "percentage": 96.64, "elapsed_time": "23:02:36", "remaining_time": "0:48:05"}
4515
+ {"current_steps": 4515, "total_steps": 4671, "loss": 0.6815, "learning_rate": 1.1222941547064159e-07, "epoch": 0.9665248454684113, "percentage": 96.66, "elapsed_time": "23:02:54", "remaining_time": "0:47:46"}
4516
+ {"current_steps": 4516, "total_steps": 4671, "loss": 0.6569, "learning_rate": 1.1079651418010706e-07, "epoch": 0.9667389152016269, "percentage": 96.68, "elapsed_time": "23:03:12", "remaining_time": "0:47:28"}
4517
+ {"current_steps": 4517, "total_steps": 4671, "loss": 0.6904, "learning_rate": 1.0937279370949461e-07, "epoch": 0.9669529849348425, "percentage": 96.7, "elapsed_time": "23:03:31", "remaining_time": "0:47:10"}
4518
+ {"current_steps": 4518, "total_steps": 4671, "loss": 0.6825, "learning_rate": 1.0795825471598742e-07, "epoch": 0.9671670546680581, "percentage": 96.72, "elapsed_time": "23:03:49", "remaining_time": "0:46:51"}
4519
+ {"current_steps": 4519, "total_steps": 4671, "loss": 0.6813, "learning_rate": 1.0655289785253875e-07, "epoch": 0.9673811244012737, "percentage": 96.75, "elapsed_time": "23:04:07", "remaining_time": "0:46:33"}
4520
+ {"current_steps": 4520, "total_steps": 4671, "loss": 0.6915, "learning_rate": 1.0515672376785413e-07, "epoch": 0.9675951941344894, "percentage": 96.77, "elapsed_time": "23:04:26", "remaining_time": "0:46:14"}
4521
+ {"current_steps": 4521, "total_steps": 4671, "loss": 0.6847, "learning_rate": 1.0376973310640692e-07, "epoch": 0.9678092638677049, "percentage": 96.79, "elapsed_time": "23:04:44", "remaining_time": "0:45:56"}
4522
+ {"current_steps": 4522, "total_steps": 4671, "loss": 0.6819, "learning_rate": 1.0239192650842944e-07, "epoch": 0.9680233336009205, "percentage": 96.81, "elapsed_time": "23:05:02", "remaining_time": "0:45:38"}
4523
+ {"current_steps": 4523, "total_steps": 4671, "loss": 0.7287, "learning_rate": 1.0102330460991516e-07, "epoch": 0.9682374033341361, "percentage": 96.83, "elapsed_time": "23:05:20", "remaining_time": "0:45:19"}
4524
+ {"current_steps": 4524, "total_steps": 4671, "loss": 0.6857, "learning_rate": 9.966386804261651e-08, "epoch": 0.9684514730673517, "percentage": 96.85, "elapsed_time": "23:05:39", "remaining_time": "0:45:01"}
4525
+ {"current_steps": 4525, "total_steps": 4671, "loss": 0.6998, "learning_rate": 9.831361743404711e-08, "epoch": 0.9686655428005673, "percentage": 96.87, "elapsed_time": "23:05:57", "remaining_time": "0:44:43"}
4526
+ {"current_steps": 4526, "total_steps": 4671, "loss": 0.6638, "learning_rate": 9.697255340748169e-08, "epoch": 0.9688796125337829, "percentage": 96.9, "elapsed_time": "23:06:15", "remaining_time": "0:44:24"}
4527
+ {"current_steps": 4527, "total_steps": 4671, "loss": 0.6685, "learning_rate": 9.564067658195175e-08, "epoch": 0.9690936822669984, "percentage": 96.92, "elapsed_time": "23:06:34", "remaining_time": "0:44:06"}
4528
+ {"current_steps": 4528, "total_steps": 4671, "loss": 0.6734, "learning_rate": 9.431798757224775e-08, "epoch": 0.969307752000214, "percentage": 96.94, "elapsed_time": "23:06:52", "remaining_time": "0:43:47"}
4529
+ {"current_steps": 4529, "total_steps": 4671, "loss": 0.7031, "learning_rate": 9.300448698892128e-08, "epoch": 0.9695218217334297, "percentage": 96.96, "elapsed_time": "23:07:10", "remaining_time": "0:43:29"}
4530
+ {"current_steps": 4530, "total_steps": 4671, "loss": 0.6823, "learning_rate": 9.170017543828291e-08, "epoch": 0.9697358914666453, "percentage": 96.98, "elapsed_time": "23:07:29", "remaining_time": "0:43:11"}
4531
+ {"current_steps": 4531, "total_steps": 4671, "loss": 0.6692, "learning_rate": 9.040505352240215e-08, "epoch": 0.9699499611998609, "percentage": 97.0, "elapsed_time": "23:07:47", "remaining_time": "0:42:52"}
4532
+ {"current_steps": 4532, "total_steps": 4671, "loss": 0.7383, "learning_rate": 8.911912183910077e-08, "epoch": 0.9701640309330765, "percentage": 97.02, "elapsed_time": "23:08:05", "remaining_time": "0:42:34"}
4533
+ {"current_steps": 4533, "total_steps": 4671, "loss": 0.6859, "learning_rate": 8.784238098196396e-08, "epoch": 0.970378100666292, "percentage": 97.05, "elapsed_time": "23:08:24", "remaining_time": "0:42:16"}
4534
+ {"current_steps": 4534, "total_steps": 4671, "loss": 0.6821, "learning_rate": 8.657483154033586e-08, "epoch": 0.9705921703995076, "percentage": 97.07, "elapsed_time": "23:08:42", "remaining_time": "0:41:57"}
4535
+ {"current_steps": 4535, "total_steps": 4671, "loss": 0.6674, "learning_rate": 8.531647409931065e-08, "epoch": 0.9708062401327232, "percentage": 97.09, "elapsed_time": "23:09:00", "remaining_time": "0:41:39"}
4536
+ {"current_steps": 4536, "total_steps": 4671, "loss": 0.689, "learning_rate": 8.406730923974593e-08, "epoch": 0.9710203098659388, "percentage": 97.11, "elapsed_time": "23:09:19", "remaining_time": "0:41:20"}
4537
+ {"current_steps": 4537, "total_steps": 4671, "loss": 0.7005, "learning_rate": 8.282733753825378e-08, "epoch": 0.9712343795991544, "percentage": 97.13, "elapsed_time": "23:09:37", "remaining_time": "0:41:02"}
4538
+ {"current_steps": 4538, "total_steps": 4671, "loss": 0.6937, "learning_rate": 8.159655956720303e-08, "epoch": 0.9714484493323701, "percentage": 97.15, "elapsed_time": "23:09:55", "remaining_time": "0:40:44"}
4539
+ {"current_steps": 4539, "total_steps": 4671, "loss": 0.6826, "learning_rate": 8.037497589471699e-08, "epoch": 0.9716625190655857, "percentage": 97.17, "elapsed_time": "23:10:14", "remaining_time": "0:40:25"}
4540
+ {"current_steps": 4540, "total_steps": 4671, "loss": 0.6925, "learning_rate": 7.916258708468016e-08, "epoch": 0.9718765887988012, "percentage": 97.2, "elapsed_time": "23:10:32", "remaining_time": "0:40:07"}
4541
+ {"current_steps": 4541, "total_steps": 4671, "loss": 0.6641, "learning_rate": 7.79593936967249e-08, "epoch": 0.9720906585320168, "percentage": 97.22, "elapsed_time": "23:10:50", "remaining_time": "0:39:49"}
4542
+ {"current_steps": 4542, "total_steps": 4671, "loss": 0.6759, "learning_rate": 7.676539628624469e-08, "epoch": 0.9723047282652324, "percentage": 97.24, "elapsed_time": "23:11:09", "remaining_time": "0:39:30"}
4543
+ {"current_steps": 4543, "total_steps": 4671, "loss": 0.7079, "learning_rate": 7.558059540438755e-08, "epoch": 0.972518797998448, "percentage": 97.26, "elapsed_time": "23:11:27", "remaining_time": "0:39:12"}
4544
+ {"current_steps": 4544, "total_steps": 4671, "loss": 0.6713, "learning_rate": 7.440499159805381e-08, "epoch": 0.9727328677316636, "percentage": 97.28, "elapsed_time": "23:11:45", "remaining_time": "0:38:53"}
4545
+ {"current_steps": 4545, "total_steps": 4671, "loss": 0.6828, "learning_rate": 7.323858540990047e-08, "epoch": 0.9729469374648791, "percentage": 97.3, "elapsed_time": "23:12:03", "remaining_time": "0:38:35"}
4546
+ {"current_steps": 4546, "total_steps": 4671, "loss": 0.701, "learning_rate": 7.208137737833908e-08, "epoch": 0.9731610071980947, "percentage": 97.32, "elapsed_time": "23:12:22", "remaining_time": "0:38:17"}
4547
+ {"current_steps": 4547, "total_steps": 4671, "loss": 0.6907, "learning_rate": 7.093336803753347e-08, "epoch": 0.9733750769313104, "percentage": 97.35, "elapsed_time": "23:12:40", "remaining_time": "0:37:58"}
4548
+ {"current_steps": 4548, "total_steps": 4671, "loss": 0.6972, "learning_rate": 6.979455791740641e-08, "epoch": 0.973589146664526, "percentage": 97.37, "elapsed_time": "23:12:58", "remaining_time": "0:37:40"}
4549
+ {"current_steps": 4549, "total_steps": 4671, "loss": 0.7268, "learning_rate": 6.86649475436263e-08, "epoch": 0.9738032163977416, "percentage": 97.39, "elapsed_time": "23:13:17", "remaining_time": "0:37:22"}
4550
+ {"current_steps": 4550, "total_steps": 4671, "loss": 0.682, "learning_rate": 6.754453743761824e-08, "epoch": 0.9740172861309572, "percentage": 97.41, "elapsed_time": "23:13:35", "remaining_time": "0:37:03"}
4551
+ {"current_steps": 4551, "total_steps": 4671, "loss": 0.7169, "learning_rate": 6.643332811656633e-08, "epoch": 0.9742313558641728, "percentage": 97.43, "elapsed_time": "23:13:53", "remaining_time": "0:36:45"}
4552
+ {"current_steps": 4552, "total_steps": 4671, "loss": 0.6747, "learning_rate": 6.533132009340026e-08, "epoch": 0.9744454255973883, "percentage": 97.45, "elapsed_time": "23:14:12", "remaining_time": "0:36:26"}
4553
+ {"current_steps": 4553, "total_steps": 4671, "loss": 0.6771, "learning_rate": 6.423851387680424e-08, "epoch": 0.9746594953306039, "percentage": 97.47, "elapsed_time": "23:14:30", "remaining_time": "0:36:08"}
4554
+ {"current_steps": 4554, "total_steps": 4671, "loss": 0.7015, "learning_rate": 6.315490997121698e-08, "epoch": 0.9748735650638195, "percentage": 97.5, "elapsed_time": "23:14:48", "remaining_time": "0:35:50"}
4555
+ {"current_steps": 4555, "total_steps": 4671, "loss": 0.718, "learning_rate": 6.208050887682727e-08, "epoch": 0.9750876347970351, "percentage": 97.52, "elapsed_time": "23:15:07", "remaining_time": "0:35:31"}
4556
+ {"current_steps": 4556, "total_steps": 4671, "loss": 0.686, "learning_rate": 6.101531108957614e-08, "epoch": 0.9753017045302508, "percentage": 97.54, "elapsed_time": "23:15:25", "remaining_time": "0:35:13"}
4557
+ {"current_steps": 4557, "total_steps": 4671, "loss": 0.6844, "learning_rate": 5.995931710115921e-08, "epoch": 0.9755157742634664, "percentage": 97.56, "elapsed_time": "23:15:43", "remaining_time": "0:34:54"}
4558
+ {"current_steps": 4558, "total_steps": 4671, "loss": 0.6894, "learning_rate": 5.891252739901765e-08, "epoch": 0.975729843996682, "percentage": 97.58, "elapsed_time": "23:16:02", "remaining_time": "0:34:36"}
4559
+ {"current_steps": 4559, "total_steps": 4671, "loss": 0.7049, "learning_rate": 5.787494246635161e-08, "epoch": 0.9759439137298975, "percentage": 97.6, "elapsed_time": "23:16:20", "remaining_time": "0:34:18"}
4560
+ {"current_steps": 4560, "total_steps": 4671, "loss": 0.6666, "learning_rate": 5.684656278210687e-08, "epoch": 0.9761579834631131, "percentage": 97.62, "elapsed_time": "23:16:38", "remaining_time": "0:33:59"}
4561
+ {"current_steps": 4561, "total_steps": 4671, "loss": 0.6831, "learning_rate": 5.5827388820979265e-08, "epoch": 0.9763720531963287, "percentage": 97.65, "elapsed_time": "23:16:57", "remaining_time": "0:33:41"}
4562
+ {"current_steps": 4562, "total_steps": 4671, "loss": 0.6602, "learning_rate": 5.481742105342136e-08, "epoch": 0.9765861229295443, "percentage": 97.67, "elapsed_time": "23:17:15", "remaining_time": "0:33:23"}
4563
+ {"current_steps": 4563, "total_steps": 4671, "loss": 0.6836, "learning_rate": 5.3816659945631346e-08, "epoch": 0.9768001926627599, "percentage": 97.69, "elapsed_time": "23:17:33", "remaining_time": "0:33:04"}
4564
+ {"current_steps": 4564, "total_steps": 4671, "loss": 0.6942, "learning_rate": 5.282510595955748e-08, "epoch": 0.9770142623959754, "percentage": 97.71, "elapsed_time": "23:17:52", "remaining_time": "0:32:46"}
4565
+ {"current_steps": 4565, "total_steps": 4671, "loss": 0.6698, "learning_rate": 5.18427595529003e-08, "epoch": 0.9772283321291911, "percentage": 97.73, "elapsed_time": "23:18:10", "remaining_time": "0:32:27"}
4566
+ {"current_steps": 4566, "total_steps": 4671, "loss": 0.6618, "learning_rate": 5.086962117910821e-08, "epoch": 0.9774424018624067, "percentage": 97.75, "elapsed_time": "23:18:29", "remaining_time": "0:32:09"}
4567
+ {"current_steps": 4567, "total_steps": 4671, "loss": 0.6799, "learning_rate": 4.990569128737965e-08, "epoch": 0.9776564715956223, "percentage": 97.77, "elapsed_time": "23:18:47", "remaining_time": "0:31:51"}
4568
+ {"current_steps": 4568, "total_steps": 4671, "loss": 0.6854, "learning_rate": 4.895097032266538e-08, "epoch": 0.9778705413288379, "percentage": 97.79, "elapsed_time": "23:19:05", "remaining_time": "0:31:32"}
4569
+ {"current_steps": 4569, "total_steps": 4671, "loss": 0.6907, "learning_rate": 4.800545872566176e-08, "epoch": 0.9780846110620535, "percentage": 97.82, "elapsed_time": "23:19:24", "remaining_time": "0:31:14"}
4570
+ {"current_steps": 4570, "total_steps": 4671, "loss": 0.6945, "learning_rate": 4.7069156932813e-08, "epoch": 0.978298680795269, "percentage": 97.84, "elapsed_time": "23:19:42", "remaining_time": "0:30:56"}
4571
+ {"current_steps": 4571, "total_steps": 4671, "loss": 0.6792, "learning_rate": 4.614206537631783e-08, "epoch": 0.9785127505284846, "percentage": 97.86, "elapsed_time": "23:20:00", "remaining_time": "0:30:37"}
4572
+ {"current_steps": 4572, "total_steps": 4671, "loss": 0.6971, "learning_rate": 4.522418448411614e-08, "epoch": 0.9787268202617002, "percentage": 97.88, "elapsed_time": "23:20:19", "remaining_time": "0:30:19"}
4573
+ {"current_steps": 4573, "total_steps": 4671, "loss": 0.6806, "learning_rate": 4.431551467990458e-08, "epoch": 0.9789408899949158, "percentage": 97.9, "elapsed_time": "23:20:37", "remaining_time": "0:30:00"}
4574
+ {"current_steps": 4574, "total_steps": 4671, "loss": 0.7087, "learning_rate": 4.3416056383120964e-08, "epoch": 0.9791549597281315, "percentage": 97.92, "elapsed_time": "23:20:55", "remaining_time": "0:29:42"}
4575
+ {"current_steps": 4575, "total_steps": 4671, "loss": 0.672, "learning_rate": 4.252581000895095e-08, "epoch": 0.9793690294613471, "percentage": 97.94, "elapsed_time": "23:21:14", "remaining_time": "0:29:24"}
4576
+ {"current_steps": 4576, "total_steps": 4671, "loss": 0.7196, "learning_rate": 4.164477596833694e-08, "epoch": 0.9795830991945627, "percentage": 97.97, "elapsed_time": "23:21:32", "remaining_time": "0:29:05"}
4577
+ {"current_steps": 4577, "total_steps": 4671, "loss": 0.6767, "learning_rate": 4.0772954667958055e-08, "epoch": 0.9797971689277782, "percentage": 97.99, "elapsed_time": "23:21:50", "remaining_time": "0:28:47"}
4578
+ {"current_steps": 4578, "total_steps": 4671, "loss": 0.7028, "learning_rate": 3.991034651024572e-08, "epoch": 0.9800112386609938, "percentage": 98.01, "elapsed_time": "23:22:09", "remaining_time": "0:28:29"}
4579
+ {"current_steps": 4579, "total_steps": 4671, "loss": 0.6947, "learning_rate": 3.905695189337921e-08, "epoch": 0.9802253083942094, "percentage": 98.03, "elapsed_time": "23:22:27", "remaining_time": "0:28:10"}
4580
+ {"current_steps": 4580, "total_steps": 4671, "loss": 0.6691, "learning_rate": 3.821277121128342e-08, "epoch": 0.980439378127425, "percentage": 98.05, "elapsed_time": "23:22:46", "remaining_time": "0:27:52"}
4581
+ {"current_steps": 4581, "total_steps": 4671, "loss": 0.6888, "learning_rate": 3.737780485363107e-08, "epoch": 0.9806534478606406, "percentage": 98.07, "elapsed_time": "23:23:04", "remaining_time": "0:27:33"}
4582
+ {"current_steps": 4582, "total_steps": 4671, "loss": 0.691, "learning_rate": 3.6552053205842766e-08, "epoch": 0.9808675175938562, "percentage": 98.09, "elapsed_time": "23:23:22", "remaining_time": "0:27:15"}
4583
+ {"current_steps": 4583, "total_steps": 4671, "loss": 0.7123, "learning_rate": 3.5735516649080257e-08, "epoch": 0.9810815873270718, "percentage": 98.12, "elapsed_time": "23:23:40", "remaining_time": "0:26:57"}
4584
+ {"current_steps": 4584, "total_steps": 4671, "loss": 0.6789, "learning_rate": 3.4928195560257614e-08, "epoch": 0.9812956570602874, "percentage": 98.14, "elapsed_time": "23:23:59", "remaining_time": "0:26:38"}
4585
+ {"current_steps": 4585, "total_steps": 4671, "loss": 0.701, "learning_rate": 3.413009031203229e-08, "epoch": 0.981509726793503, "percentage": 98.16, "elapsed_time": "23:24:17", "remaining_time": "0:26:20"}
4586
+ {"current_steps": 4586, "total_steps": 4671, "loss": 0.6722, "learning_rate": 3.334120127280738e-08, "epoch": 0.9817237965267186, "percentage": 98.18, "elapsed_time": "23:24:36", "remaining_time": "0:26:02"}
4587
+ {"current_steps": 4587, "total_steps": 4671, "loss": 0.7032, "learning_rate": 3.256152880673602e-08, "epoch": 0.9819378662599342, "percentage": 98.2, "elapsed_time": "23:24:55", "remaining_time": "0:25:43"}
4588
+ {"current_steps": 4588, "total_steps": 4671, "loss": 0.6785, "learning_rate": 3.179107327370812e-08, "epoch": 0.9821519359931498, "percentage": 98.22, "elapsed_time": "23:25:14", "remaining_time": "0:25:25"}
4589
+ {"current_steps": 4589, "total_steps": 4671, "loss": 0.6929, "learning_rate": 3.102983502937029e-08, "epoch": 0.9823660057263653, "percentage": 98.24, "elapsed_time": "23:25:33", "remaining_time": "0:25:06"}
4590
+ {"current_steps": 4590, "total_steps": 4671, "loss": 0.6589, "learning_rate": 3.027781442510369e-08, "epoch": 0.9825800754595809, "percentage": 98.27, "elapsed_time": "23:25:52", "remaining_time": "0:24:48"}
4591
+ {"current_steps": 4591, "total_steps": 4671, "loss": 0.6876, "learning_rate": 2.9535011808043967e-08, "epoch": 0.9827941451927965, "percentage": 98.29, "elapsed_time": "23:26:10", "remaining_time": "0:24:30"}
4592
+ {"current_steps": 4592, "total_steps": 4671, "loss": 0.6623, "learning_rate": 2.880142752106574e-08, "epoch": 0.9830082149260122, "percentage": 98.31, "elapsed_time": "23:26:29", "remaining_time": "0:24:11"}
4593
+ {"current_steps": 4593, "total_steps": 4671, "loss": 0.6812, "learning_rate": 2.8077061902787028e-08, "epoch": 0.9832222846592278, "percentage": 98.33, "elapsed_time": "23:26:47", "remaining_time": "0:23:53"}
4594
+ {"current_steps": 4594, "total_steps": 4671, "loss": 0.6596, "learning_rate": 2.7361915287578144e-08, "epoch": 0.9834363543924434, "percentage": 98.35, "elapsed_time": "23:27:06", "remaining_time": "0:23:35"}
4595
+ {"current_steps": 4595, "total_steps": 4671, "loss": 0.6826, "learning_rate": 2.665598800554836e-08, "epoch": 0.983650424125659, "percentage": 98.37, "elapsed_time": "23:27:24", "remaining_time": "0:23:16"}
4596
+ {"current_steps": 4596, "total_steps": 4671, "loss": 0.6894, "learning_rate": 2.5959280382550355e-08, "epoch": 0.9838644938588745, "percentage": 98.39, "elapsed_time": "23:27:42", "remaining_time": "0:22:58"}
4597
+ {"current_steps": 4597, "total_steps": 4671, "loss": 0.6654, "learning_rate": 2.5271792740186874e-08, "epoch": 0.9840785635920901, "percentage": 98.42, "elapsed_time": "23:28:01", "remaining_time": "0:22:39"}
4598
+ {"current_steps": 4598, "total_steps": 4671, "loss": 0.6888, "learning_rate": 2.4593525395797402e-08, "epoch": 0.9842926333253057, "percentage": 98.44, "elapsed_time": "23:28:19", "remaining_time": "0:22:21"}
4599
+ {"current_steps": 4599, "total_steps": 4671, "loss": 0.7035, "learning_rate": 2.3924478662469275e-08, "epoch": 0.9845067030585213, "percentage": 98.46, "elapsed_time": "23:28:38", "remaining_time": "0:22:03"}
4600
+ {"current_steps": 4600, "total_steps": 4671, "loss": 0.6904, "learning_rate": 2.326465284903545e-08, "epoch": 0.9847207727917369, "percentage": 98.48, "elapsed_time": "23:28:56", "remaining_time": "0:21:44"}
4601
+ {"current_steps": 4601, "total_steps": 4671, "loss": 0.6757, "learning_rate": 2.2614048260067856e-08, "epoch": 0.9849348425249526, "percentage": 98.5, "elapsed_time": "23:29:14", "remaining_time": "0:21:26"}
4602
+ {"current_steps": 4602, "total_steps": 4671, "loss": 0.6883, "learning_rate": 2.1972665195886256e-08, "epoch": 0.9851489122581681, "percentage": 98.52, "elapsed_time": "23:29:33", "remaining_time": "0:21:08"}
4603
+ {"current_steps": 4603, "total_steps": 4671, "loss": 0.69, "learning_rate": 2.1340503952551606e-08, "epoch": 0.9853629819913837, "percentage": 98.54, "elapsed_time": "23:29:51", "remaining_time": "0:20:49"}
4604
+ {"current_steps": 4604, "total_steps": 4671, "loss": 0.7155, "learning_rate": 2.0717564821868264e-08, "epoch": 0.9855770517245993, "percentage": 98.57, "elapsed_time": "23:30:10", "remaining_time": "0:20:31"}
4605
+ {"current_steps": 4605, "total_steps": 4671, "loss": 0.6773, "learning_rate": 2.0103848091381773e-08, "epoch": 0.9857911214578149, "percentage": 98.59, "elapsed_time": "23:30:28", "remaining_time": "0:20:12"}
4606
+ {"current_steps": 4606, "total_steps": 4671, "loss": 0.6888, "learning_rate": 1.949935404438552e-08, "epoch": 0.9860051911910305, "percentage": 98.61, "elapsed_time": "23:30:46", "remaining_time": "0:19:54"}
4607
+ {"current_steps": 4607, "total_steps": 4671, "loss": 0.6626, "learning_rate": 1.890408295990964e-08, "epoch": 0.986219260924246, "percentage": 98.63, "elapsed_time": "23:31:05", "remaining_time": "0:19:36"}
4608
+ {"current_steps": 4608, "total_steps": 4671, "loss": 0.6882, "learning_rate": 1.8318035112734335e-08, "epoch": 0.9864333306574616, "percentage": 98.65, "elapsed_time": "23:31:23", "remaining_time": "0:19:17"}
4609
+ {"current_steps": 4609, "total_steps": 4671, "loss": 0.6898, "learning_rate": 1.7741210773376538e-08, "epoch": 0.9866474003906772, "percentage": 98.67, "elapsed_time": "23:31:41", "remaining_time": "0:18:59"}
4610
+ {"current_steps": 4610, "total_steps": 4671, "loss": 0.656, "learning_rate": 1.7173610208096603e-08, "epoch": 0.9868614701238928, "percentage": 98.69, "elapsed_time": "23:32:00", "remaining_time": "0:18:41"}
4611
+ {"current_steps": 4611, "total_steps": 4671, "loss": 0.6772, "learning_rate": 1.661523367889606e-08, "epoch": 0.9870755398571085, "percentage": 98.72, "elapsed_time": "23:32:18", "remaining_time": "0:18:22"}
4612
+ {"current_steps": 4612, "total_steps": 4671, "loss": 0.7211, "learning_rate": 1.6066081443524284e-08, "epoch": 0.9872896095903241, "percentage": 98.74, "elapsed_time": "23:32:37", "remaining_time": "0:18:04"}
4613
+ {"current_steps": 4613, "total_steps": 4671, "loss": 0.6624, "learning_rate": 1.55261537554674e-08, "epoch": 0.9875036793235397, "percentage": 98.76, "elapsed_time": "23:32:55", "remaining_time": "0:17:45"}
4614
+ {"current_steps": 4614, "total_steps": 4671, "loss": 0.6876, "learning_rate": 1.499545086395493e-08, "epoch": 0.9877177490567552, "percentage": 98.78, "elapsed_time": "23:33:13", "remaining_time": "0:17:27"}
4615
+ {"current_steps": 4615, "total_steps": 4671, "loss": 0.6934, "learning_rate": 1.4473973013957587e-08, "epoch": 0.9879318187899708, "percentage": 98.8, "elapsed_time": "23:33:32", "remaining_time": "0:17:09"}
4616
+ {"current_steps": 4616, "total_steps": 4671, "loss": 0.7093, "learning_rate": 1.3961720446191707e-08, "epoch": 0.9881458885231864, "percentage": 98.82, "elapsed_time": "23:33:50", "remaining_time": "0:16:50"}
4617
+ {"current_steps": 4617, "total_steps": 4671, "loss": 0.6757, "learning_rate": 1.3458693397105926e-08, "epoch": 0.988359958256402, "percentage": 98.84, "elapsed_time": "23:34:08", "remaining_time": "0:16:32"}
4618
+ {"current_steps": 4618, "total_steps": 4671, "loss": 0.6857, "learning_rate": 1.2964892098903393e-08, "epoch": 0.9885740279896176, "percentage": 98.87, "elapsed_time": "23:34:27", "remaining_time": "0:16:14"}
4619
+ {"current_steps": 4619, "total_steps": 4671, "loss": 0.7003, "learning_rate": 1.2480316779517332e-08, "epoch": 0.9887880977228332, "percentage": 98.89, "elapsed_time": "23:34:45", "remaining_time": "0:15:55"}
4620
+ {"current_steps": 4620, "total_steps": 4671, "loss": 0.6971, "learning_rate": 1.2004967662628819e-08, "epoch": 0.9890021674560489, "percentage": 98.91, "elapsed_time": "23:35:04", "remaining_time": "0:15:37"}
4621
+ {"current_steps": 4621, "total_steps": 4671, "loss": 0.6693, "learning_rate": 1.1538844967660112e-08, "epoch": 0.9892162371892644, "percentage": 98.93, "elapsed_time": "23:35:22", "remaining_time": "0:15:18"}
4622
+ {"current_steps": 4622, "total_steps": 4671, "loss": 0.6588, "learning_rate": 1.1081948909767992e-08, "epoch": 0.98943030692248, "percentage": 98.95, "elapsed_time": "23:35:40", "remaining_time": "0:15:00"}
4623
+ {"current_steps": 4623, "total_steps": 4671, "loss": 0.6686, "learning_rate": 1.0634279699857086e-08, "epoch": 0.9896443766556956, "percentage": 98.97, "elapsed_time": "23:35:59", "remaining_time": "0:14:42"}
4624
+ {"current_steps": 4624, "total_steps": 4671, "loss": 0.6897, "learning_rate": 1.0195837544570986e-08, "epoch": 0.9898584463889112, "percentage": 98.99, "elapsed_time": "23:36:17", "remaining_time": "0:14:23"}
4625
+ {"current_steps": 4625, "total_steps": 4671, "loss": 0.6883, "learning_rate": 9.766622646292246e-09, "epoch": 0.9900725161221268, "percentage": 99.02, "elapsed_time": "23:36:36", "remaining_time": "0:14:05"}
4626
+ {"current_steps": 4626, "total_steps": 4671, "loss": 0.6952, "learning_rate": 9.346635203149046e-09, "epoch": 0.9902865858553423, "percentage": 99.04, "elapsed_time": "23:36:54", "remaining_time": "0:13:46"}
4627
+ {"current_steps": 4627, "total_steps": 4671, "loss": 0.7011, "learning_rate": 8.93587540900409e-09, "epoch": 0.9905006555885579, "percentage": 99.06, "elapsed_time": "23:37:12", "remaining_time": "0:13:28"}
4628
+ {"current_steps": 4628, "total_steps": 4671, "loss": 0.6856, "learning_rate": 8.53434345346349e-09, "epoch": 0.9907147253217735, "percentage": 99.08, "elapsed_time": "23:37:31", "remaining_time": "0:13:10"}
4629
+ {"current_steps": 4629, "total_steps": 4671, "loss": 0.7048, "learning_rate": 8.142039521874534e-09, "epoch": 0.9909287950549892, "percentage": 99.1, "elapsed_time": "23:37:49", "remaining_time": "0:12:51"}
4630
+ {"current_steps": 4630, "total_steps": 4671, "loss": 0.7063, "learning_rate": 7.758963795321262e-09, "epoch": 0.9911428647882048, "percentage": 99.12, "elapsed_time": "23:38:07", "remaining_time": "0:12:33"}
4631
+ {"current_steps": 4631, "total_steps": 4671, "loss": 0.6911, "learning_rate": 7.385116450635555e-09, "epoch": 0.9913569345214204, "percentage": 99.14, "elapsed_time": "23:38:26", "remaining_time": "0:12:15"}
4632
+ {"current_steps": 4632, "total_steps": 4671, "loss": 0.6892, "learning_rate": 7.020497660381598e-09, "epoch": 0.991571004254636, "percentage": 99.17, "elapsed_time": "23:38:44", "remaining_time": "0:11:56"}
4633
+ {"current_steps": 4633, "total_steps": 4671, "loss": 0.6951, "learning_rate": 6.665107592866982e-09, "epoch": 0.9917850739878515, "percentage": 99.19, "elapsed_time": "23:39:03", "remaining_time": "0:11:38"}
4634
+ {"current_steps": 4634, "total_steps": 4671, "loss": 0.7092, "learning_rate": 6.318946412140481e-09, "epoch": 0.9919991437210671, "percentage": 99.21, "elapsed_time": "23:39:21", "remaining_time": "0:11:19"}
4635
+ {"current_steps": 4635, "total_steps": 4671, "loss": 0.6828, "learning_rate": 5.982014277987614e-09, "epoch": 0.9922132134542827, "percentage": 99.23, "elapsed_time": "23:39:39", "remaining_time": "0:11:01"}
4636
+ {"current_steps": 4636, "total_steps": 4671, "loss": 0.697, "learning_rate": 5.654311345937302e-09, "epoch": 0.9924272831874983, "percentage": 99.25, "elapsed_time": "23:39:58", "remaining_time": "0:10:43"}
4637
+ {"current_steps": 4637, "total_steps": 4671, "loss": 0.6745, "learning_rate": 5.335837767255214e-09, "epoch": 0.9926413529207139, "percentage": 99.27, "elapsed_time": "23:40:17", "remaining_time": "0:10:24"}
4638
+ {"current_steps": 4638, "total_steps": 4671, "loss": 0.7088, "learning_rate": 5.0265936889482e-09, "epoch": 0.9928554226539296, "percentage": 99.29, "elapsed_time": "23:40:35", "remaining_time": "0:10:06"}
4639
+ {"current_steps": 4639, "total_steps": 4671, "loss": 0.6977, "learning_rate": 4.726579253764296e-09, "epoch": 0.9930694923871451, "percentage": 99.31, "elapsed_time": "23:40:54", "remaining_time": "0:09:48"}
4640
+ {"current_steps": 4640, "total_steps": 4671, "loss": 0.6939, "learning_rate": 4.435794600188281e-09, "epoch": 0.9932835621203607, "percentage": 99.34, "elapsed_time": "23:41:12", "remaining_time": "0:09:29"}
4641
+ {"current_steps": 4641, "total_steps": 4671, "loss": 0.6735, "learning_rate": 4.154239862446119e-09, "epoch": 0.9934976318535763, "percentage": 99.36, "elapsed_time": "23:41:31", "remaining_time": "0:09:11"}
4642
+ {"current_steps": 4642, "total_steps": 4671, "loss": 0.676, "learning_rate": 3.881915170502737e-09, "epoch": 0.9937117015867919, "percentage": 99.38, "elapsed_time": "23:41:49", "remaining_time": "0:08:52"}
4643
+ {"current_steps": 4643, "total_steps": 4671, "loss": 0.6977, "learning_rate": 3.6188206500620273e-09, "epoch": 0.9939257713200075, "percentage": 99.4, "elapsed_time": "23:42:07", "remaining_time": "0:08:34"}
4644
+ {"current_steps": 4644, "total_steps": 4671, "loss": 0.6772, "learning_rate": 3.3649564225690655e-09, "epoch": 0.9941398410532231, "percentage": 99.42, "elapsed_time": "23:42:26", "remaining_time": "0:08:16"}
4645
+ {"current_steps": 4645, "total_steps": 4671, "loss": 0.6993, "learning_rate": 3.1203226052078926e-09, "epoch": 0.9943539107864386, "percentage": 99.44, "elapsed_time": "23:42:44", "remaining_time": "0:07:57"}
4646
+ {"current_steps": 4646, "total_steps": 4671, "loss": 0.7144, "learning_rate": 2.8849193109015127e-09, "epoch": 0.9945679805196542, "percentage": 99.46, "elapsed_time": "23:43:02", "remaining_time": "0:07:39"}
4647
+ {"current_steps": 4647, "total_steps": 4671, "loss": 0.7093, "learning_rate": 2.658746648307453e-09, "epoch": 0.9947820502528699, "percentage": 99.49, "elapsed_time": "23:43:21", "remaining_time": "0:07:21"}
4648
+ {"current_steps": 4648, "total_steps": 4671, "loss": 0.6689, "learning_rate": 2.441804721831087e-09, "epoch": 0.9949961199860855, "percentage": 99.51, "elapsed_time": "23:43:39", "remaining_time": "0:07:02"}
4649
+ {"current_steps": 4649, "total_steps": 4671, "loss": 0.6726, "learning_rate": 2.2340936316100904e-09, "epoch": 0.9952101897193011, "percentage": 99.53, "elapsed_time": "23:43:58", "remaining_time": "0:06:44"}
4650
+ {"current_steps": 4650, "total_steps": 4671, "loss": 0.6944, "learning_rate": 2.0356134735233234e-09, "epoch": 0.9954242594525167, "percentage": 99.55, "elapsed_time": "23:44:16", "remaining_time": "0:06:25"}
4651
+ {"current_steps": 4651, "total_steps": 4671, "loss": 0.7099, "learning_rate": 1.8463643391908314e-09, "epoch": 0.9956383291857323, "percentage": 99.57, "elapsed_time": "23:44:34", "remaining_time": "0:06:07"}
4652
+ {"current_steps": 4652, "total_steps": 4671, "loss": 0.678, "learning_rate": 1.6663463159671821e-09, "epoch": 0.9958523989189478, "percentage": 99.59, "elapsed_time": "23:44:53", "remaining_time": "0:05:49"}
4653
+ {"current_steps": 4653, "total_steps": 4671, "loss": 0.671, "learning_rate": 1.4955594869525692e-09, "epoch": 0.9960664686521634, "percentage": 99.61, "elapsed_time": "23:45:11", "remaining_time": "0:05:30"}
4654
+ {"current_steps": 4654, "total_steps": 4671, "loss": 0.6952, "learning_rate": 1.3340039309750475e-09, "epoch": 0.996280538385379, "percentage": 99.64, "elapsed_time": "23:45:29", "remaining_time": "0:05:12"}
4655
+ {"current_steps": 4655, "total_steps": 4671, "loss": 0.7047, "learning_rate": 1.181679722614959e-09, "epoch": 0.9964946081185946, "percentage": 99.66, "elapsed_time": "23:45:48", "remaining_time": "0:04:54"}
4656
+ {"current_steps": 4656, "total_steps": 4671, "loss": 0.6706, "learning_rate": 1.038586932182728e-09, "epoch": 0.9967086778518103, "percentage": 99.68, "elapsed_time": "23:46:06", "remaining_time": "0:04:35"}
4657
+ {"current_steps": 4657, "total_steps": 4671, "loss": 0.6837, "learning_rate": 9.047256257277426e-10, "epoch": 0.9969227475850259, "percentage": 99.7, "elapsed_time": "23:46:25", "remaining_time": "0:04:17"}
4658
+ {"current_steps": 4658, "total_steps": 4671, "loss": 0.7018, "learning_rate": 7.800958650405754e-10, "epoch": 0.9971368173182414, "percentage": 99.72, "elapsed_time": "23:46:43", "remaining_time": "0:03:58"}
4659
+ {"current_steps": 4659, "total_steps": 4671, "loss": 0.6969, "learning_rate": 6.646977076529837e-10, "epoch": 0.997350887051457, "percentage": 99.74, "elapsed_time": "23:47:01", "remaining_time": "0:03:40"}
4660
+ {"current_steps": 4660, "total_steps": 4671, "loss": 0.6465, "learning_rate": 5.585312068312476e-10, "epoch": 0.9975649567846726, "percentage": 99.76, "elapsed_time": "23:47:20", "remaining_time": "0:03:22"}
4661
+ {"current_steps": 4661, "total_steps": 4671, "loss": 0.7069, "learning_rate": 4.6159641157839107e-10, "epoch": 0.9977790265178882, "percentage": 99.79, "elapsed_time": "23:47:38", "remaining_time": "0:03:03"}
4662
+ {"current_steps": 4662, "total_steps": 4671, "loss": 0.6816, "learning_rate": 3.738933666430633e-10, "epoch": 0.9979930962511038, "percentage": 99.81, "elapsed_time": "23:47:56", "remaining_time": "0:02:45"}
4663
+ {"current_steps": 4663, "total_steps": 4671, "loss": 0.6965, "learning_rate": 2.954221125084367e-10, "epoch": 0.9982071659843194, "percentage": 99.83, "elapsed_time": "23:48:15", "remaining_time": "0:02:27"}
4664
+ {"current_steps": 4664, "total_steps": 4671, "loss": 0.6604, "learning_rate": 2.2618268539664756e-10, "epoch": 0.9984212357175349, "percentage": 99.85, "elapsed_time": "23:48:33", "remaining_time": "0:02:08"}
4665
+ {"current_steps": 4665, "total_steps": 4671, "loss": 0.6893, "learning_rate": 1.6617511726657597e-10, "epoch": 0.9986353054507506, "percentage": 99.87, "elapsed_time": "23:48:52", "remaining_time": "0:01:50"}
4666
+ {"current_steps": 4666, "total_steps": 4671, "loss": 0.6664, "learning_rate": 1.1539943582050683e-10, "epoch": 0.9988493751839662, "percentage": 99.89, "elapsed_time": "23:49:10", "remaining_time": "0:01:31"}
4667
+ {"current_steps": 4667, "total_steps": 4671, "loss": 0.6659, "learning_rate": 7.385566449302773e-11, "epoch": 0.9990634449171818, "percentage": 99.91, "elapsed_time": "23:49:28", "remaining_time": "0:01:13"}
4668
+ {"current_steps": 4668, "total_steps": 4671, "loss": 0.6698, "learning_rate": 4.154382246435162e-11, "epoch": 0.9992775146503974, "percentage": 99.94, "elapsed_time": "23:49:47", "remaining_time": "0:00:55"}
4669
+ {"current_steps": 4669, "total_steps": 4671, "loss": 0.6786, "learning_rate": 1.8463924646994202e-11, "epoch": 0.999491584383613, "percentage": 99.96, "elapsed_time": "23:50:05", "remaining_time": "0:00:36"}
4670
+ {"current_steps": 4670, "total_steps": 4671, "loss": 0.6913, "learning_rate": 4.615981694655603e-12, "epoch": 0.9997056541168285, "percentage": 99.98, "elapsed_time": "23:50:23", "remaining_time": "0:00:18"}
4671
+ {"current_steps": 4671, "total_steps": 4671, "loss": 0.6768, "learning_rate": 0.0, "epoch": 0.9999197238500441, "percentage": 100.0, "elapsed_time": "23:50:42", "remaining_time": "0:00:00"}
4672
+ {"current_steps": 4671, "total_steps": 4671, "epoch": 0.9999197238500441, "percentage": 100.0, "elapsed_time": "23:51:09", "remaining_time": "0:00:00"}