{"current_steps": 2, "total_steps": 408, "loss": 0.6931, "accuracy": 0.0, "learning_rate": 2.439024390243903e-07, "epoch": 0.014678899082568808, "percentage": 0.49, "elapsed_time": "0:00:31", "remaining_time": "1:47:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4, "total_steps": 408, "loss": 0.6923, "accuracy": 0.59375, "learning_rate": 4.878048780487805e-07, "epoch": 0.029357798165137616, "percentage": 0.98, "elapsed_time": "0:01:20", "remaining_time": "2:15:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6, "total_steps": 408, "loss": 0.693, "accuracy": 0.546875, "learning_rate": 7.317073170731707e-07, "epoch": 0.044036697247706424, "percentage": 1.47, "elapsed_time": "0:02:07", "remaining_time": "2:22:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8, "total_steps": 408, "loss": 0.6924, "accuracy": 0.515625, "learning_rate": 9.75609756097561e-07, "epoch": 0.05871559633027523, "percentage": 1.96, "elapsed_time": "0:02:39", "remaining_time": "2:13:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10, "total_steps": 408, "loss": 0.6924, "accuracy": 0.59375, "learning_rate": 1.2195121951219514e-06, "epoch": 0.07339449541284404, "percentage": 2.45, "elapsed_time": "0:03:23", "remaining_time": "2:14:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12, "total_steps": 408, "loss": 0.6934, "accuracy": 0.46875, "learning_rate": 1.4634146341463414e-06, "epoch": 0.08807339449541285, "percentage": 2.94, "elapsed_time": "0:03:58", "remaining_time": "2:11:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14, "total_steps": 408, "loss": 0.6932, "accuracy": 0.484375, "learning_rate": 1.707317073170732e-06, "epoch": 0.10275229357798166, "percentage": 3.43, "elapsed_time": "0:04:31", "remaining_time": "2:07:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16, "total_steps": 408, "loss": 0.6928, "accuracy": 0.53125, "learning_rate": 1.951219512195122e-06, "epoch": 0.11743119266055047, "percentage": 3.92, "elapsed_time": "0:05:07", "remaining_time": "2:05:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18, "total_steps": 408, "loss": 0.6923, "accuracy": 0.625, "learning_rate": 2.1951219512195125e-06, "epoch": 0.13211009174311927, "percentage": 4.41, "elapsed_time": "0:05:45", "remaining_time": "2:04:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20, "total_steps": 408, "loss": 0.6934, "accuracy": 0.421875, "learning_rate": 2.4390243902439027e-06, "epoch": 0.14678899082568808, "percentage": 4.9, "elapsed_time": "0:06:27", "remaining_time": "2:05:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22, "total_steps": 408, "loss": 0.6933, "accuracy": 0.484375, "learning_rate": 2.682926829268293e-06, "epoch": 0.1614678899082569, "percentage": 5.39, "elapsed_time": "0:07:16", "remaining_time": "2:07:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24, "total_steps": 408, "loss": 0.693, "accuracy": 0.546875, "learning_rate": 2.926829268292683e-06, "epoch": 0.1761467889908257, "percentage": 5.88, "elapsed_time": "0:07:49", "remaining_time": "2:05:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26, "total_steps": 408, "loss": 0.6929, "accuracy": 0.5625, "learning_rate": 3.1707317073170736e-06, "epoch": 0.1908256880733945, "percentage": 6.37, "elapsed_time": "0:08:26", "remaining_time": "2:03:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28, "total_steps": 408, "loss": 0.6931, "accuracy": 0.453125, "learning_rate": 3.414634146341464e-06, "epoch": 0.20550458715596331, "percentage": 6.86, "elapsed_time": "0:09:05", "remaining_time": "2:03:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30, "total_steps": 408, "loss": 0.693, "accuracy": 0.4375, "learning_rate": 3.6585365853658537e-06, "epoch": 0.22018348623853212, "percentage": 7.35, "elapsed_time": "0:09:42", "remaining_time": "2:02:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 32, "total_steps": 408, "loss": 0.6928, "accuracy": 0.5, "learning_rate": 3.902439024390244e-06, "epoch": 0.23486238532110093, "percentage": 7.84, "elapsed_time": "0:10:31", "remaining_time": "2:03:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 34, "total_steps": 408, "loss": 0.6922, "accuracy": 0.5625, "learning_rate": 4.146341463414634e-06, "epoch": 0.24954128440366974, "percentage": 8.33, "elapsed_time": "0:11:18", "remaining_time": "2:04:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 36, "total_steps": 408, "loss": 0.6921, "accuracy": 0.640625, "learning_rate": 4.390243902439025e-06, "epoch": 0.26422018348623855, "percentage": 8.82, "elapsed_time": "0:12:06", "remaining_time": "2:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 38, "total_steps": 408, "loss": 0.692, "accuracy": 0.59375, "learning_rate": 4.634146341463416e-06, "epoch": 0.27889908256880735, "percentage": 9.31, "elapsed_time": "0:12:46", "remaining_time": "2:04:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 40, "total_steps": 408, "loss": 0.6912, "accuracy": 0.703125, "learning_rate": 4.8780487804878055e-06, "epoch": 0.29357798165137616, "percentage": 9.8, "elapsed_time": "0:13:22", "remaining_time": "2:02:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 42, "total_steps": 408, "loss": 0.6911, "accuracy": 0.71875, "learning_rate": 4.999908404322799e-06, "epoch": 0.30825688073394497, "percentage": 10.29, "elapsed_time": "0:13:58", "remaining_time": "2:01:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 44, "total_steps": 408, "loss": 0.6908, "accuracy": 0.703125, "learning_rate": 4.999175679175577e-06, "epoch": 0.3229357798165138, "percentage": 10.78, "elapsed_time": "0:14:36", "remaining_time": "2:00:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 46, "total_steps": 408, "loss": 0.6905, "accuracy": 0.671875, "learning_rate": 4.997710443643461e-06, "epoch": 0.3376146788990826, "percentage": 11.27, "elapsed_time": "0:15:34", "remaining_time": "2:02:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 48, "total_steps": 408, "loss": 0.6896, "accuracy": 0.8125, "learning_rate": 4.995513127188151e-06, "epoch": 0.3522935779816514, "percentage": 11.76, "elapsed_time": "0:16:22", "remaining_time": "2:02:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 408, "loss": 0.6892, "accuracy": 0.8125, "learning_rate": 4.992584373844853e-06, "epoch": 0.3669724770642202, "percentage": 12.25, "elapsed_time": "0:17:01", "remaining_time": "2:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 52, "total_steps": 408, "loss": 0.6887, "accuracy": 0.875, "learning_rate": 4.98892504203351e-06, "epoch": 0.381651376146789, "percentage": 12.75, "elapsed_time": "0:17:37", "remaining_time": "2:00:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 54, "total_steps": 408, "loss": 0.6883, "accuracy": 0.890625, "learning_rate": 4.9845362043071925e-06, "epoch": 0.3963302752293578, "percentage": 13.24, "elapsed_time": "0:18:11", "remaining_time": "1:59:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 56, "total_steps": 408, "loss": 0.6876, "accuracy": 0.875, "learning_rate": 4.97941914703774e-06, "epoch": 0.41100917431192663, "percentage": 13.73, "elapsed_time": "0:19:00", "remaining_time": "1:59:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 58, "total_steps": 408, "loss": 0.6845, "accuracy": 0.921875, "learning_rate": 4.973575370038718e-06, "epoch": 0.42568807339449544, "percentage": 14.22, "elapsed_time": "0:19:43", "remaining_time": "1:59:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 60, "total_steps": 408, "loss": 0.6839, "accuracy": 0.96875, "learning_rate": 4.967006586125827e-06, "epoch": 0.44036697247706424, "percentage": 14.71, "elapsed_time": "0:20:21", "remaining_time": "1:58:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 62, "total_steps": 408, "loss": 0.6818, "accuracy": 0.984375, "learning_rate": 4.959714720614871e-06, "epoch": 0.45504587155963305, "percentage": 15.2, "elapsed_time": "0:21:11", "remaining_time": "1:58:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 64, "total_steps": 408, "loss": 0.6816, "accuracy": 0.96875, "learning_rate": 4.951701910757446e-06, "epoch": 0.46972477064220186, "percentage": 15.69, "elapsed_time": "0:21:51", "remaining_time": "1:57:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 66, "total_steps": 408, "loss": 0.6806, "accuracy": 0.984375, "learning_rate": 4.942970505114514e-06, "epoch": 0.48440366972477067, "percentage": 16.18, "elapsed_time": "0:22:24", "remaining_time": "1:56:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 68, "total_steps": 408, "loss": 0.6789, "accuracy": 0.984375, "learning_rate": 4.933523062868033e-06, "epoch": 0.4990825688073395, "percentage": 16.67, "elapsed_time": "0:22:57", "remaining_time": "1:54:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 408, "loss": 0.6754, "accuracy": 0.984375, "learning_rate": 4.923362353070859e-06, "epoch": 0.5137614678899083, "percentage": 17.16, "elapsed_time": "0:23:33", "remaining_time": "1:53:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 72, "total_steps": 408, "loss": 0.6766, "accuracy": 0.984375, "learning_rate": 4.912491353835138e-06, "epoch": 0.5284403669724771, "percentage": 17.65, "elapsed_time": "0:24:22", "remaining_time": "1:53:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 74, "total_steps": 408, "loss": 0.6737, "accuracy": 1.0, "learning_rate": 4.900913251459418e-06, "epoch": 0.5431192660550459, "percentage": 18.14, "elapsed_time": "0:24:57", "remaining_time": "1:52:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 76, "total_steps": 408, "loss": 0.6685, "accuracy": 0.984375, "learning_rate": 4.8886314394947396e-06, "epoch": 0.5577981651376147, "percentage": 18.63, "elapsed_time": "0:25:30", "remaining_time": "1:51:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 78, "total_steps": 408, "loss": 0.6669, "accuracy": 0.96875, "learning_rate": 4.875649517749985e-06, "epoch": 0.5724770642201835, "percentage": 19.12, "elapsed_time": "0:26:02", "remaining_time": "1:50:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 80, "total_steps": 408, "loss": 0.6677, "accuracy": 0.953125, "learning_rate": 4.861971291236772e-06, "epoch": 0.5871559633027523, "percentage": 19.61, "elapsed_time": "0:26:39", "remaining_time": "1:49:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 82, "total_steps": 408, "loss": 0.6624, "accuracy": 0.953125, "learning_rate": 4.847600769054201e-06, "epoch": 0.6018348623853211, "percentage": 20.1, "elapsed_time": "0:27:24", "remaining_time": "1:48:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 84, "total_steps": 408, "loss": 0.6609, "accuracy": 0.984375, "learning_rate": 4.832542163213787e-06, "epoch": 0.6165137614678899, "percentage": 20.59, "elapsed_time": "0:27:58", "remaining_time": "1:47:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 86, "total_steps": 408, "loss": 0.6605, "accuracy": 0.984375, "learning_rate": 4.816799887404911e-06, "epoch": 0.6311926605504588, "percentage": 21.08, "elapsed_time": "0:28:44", "remaining_time": "1:47:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 88, "total_steps": 408, "loss": 0.6556, "accuracy": 0.984375, "learning_rate": 4.800378555701168e-06, "epoch": 0.6458715596330276, "percentage": 21.57, "elapsed_time": "0:29:22", "remaining_time": "1:46:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 90, "total_steps": 408, "loss": 0.6542, "accuracy": 0.96875, "learning_rate": 4.783282981207979e-06, "epoch": 0.6605504587155964, "percentage": 22.06, "elapsed_time": "0:30:01", "remaining_time": "1:46:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 92, "total_steps": 408, "loss": 0.6516, "accuracy": 0.96875, "learning_rate": 4.765518174651864e-06, "epoch": 0.6752293577981652, "percentage": 22.55, "elapsed_time": "0:30:36", "remaining_time": "1:45:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 94, "total_steps": 408, "loss": 0.6465, "accuracy": 1.0, "learning_rate": 4.747089342911793e-06, "epoch": 0.689908256880734, "percentage": 23.04, "elapsed_time": "0:31:21", "remaining_time": "1:44:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 96, "total_steps": 408, "loss": 0.6461, "accuracy": 0.96875, "learning_rate": 4.728001887493048e-06, "epoch": 0.7045871559633028, "percentage": 23.53, "elapsed_time": "0:31:55", "remaining_time": "1:43:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 98, "total_steps": 408, "loss": 0.6373, "accuracy": 0.984375, "learning_rate": 4.708261402944036e-06, "epoch": 0.7192660550458716, "percentage": 24.02, "elapsed_time": "0:32:36", "remaining_time": "1:43:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 408, "loss": 0.6391, "accuracy": 0.953125, "learning_rate": 4.687873675216522e-06, "epoch": 0.7339449541284404, "percentage": 24.51, "elapsed_time": "0:33:21", "remaining_time": "1:42:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 102, "total_steps": 408, "loss": 0.6356, "accuracy": 1.0, "learning_rate": 4.666844679969765e-06, "epoch": 0.7486238532110092, "percentage": 25.0, "elapsed_time": "0:34:16", "remaining_time": "1:42:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 104, "total_steps": 408, "loss": 0.6312, "accuracy": 1.0, "learning_rate": 4.6451805808190464e-06, "epoch": 0.763302752293578, "percentage": 25.49, "elapsed_time": "0:34:50", "remaining_time": "1:41:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 106, "total_steps": 408, "loss": 0.6281, "accuracy": 1.0, "learning_rate": 4.622887727529104e-06, "epoch": 0.7779816513761468, "percentage": 25.98, "elapsed_time": "0:35:30", "remaining_time": "1:41:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 108, "total_steps": 408, "loss": 0.6238, "accuracy": 1.0, "learning_rate": 4.599972654153018e-06, "epoch": 0.7926605504587156, "percentage": 26.47, "elapsed_time": "0:36:01", "remaining_time": "1:40:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 110, "total_steps": 408, "loss": 0.6226, "accuracy": 1.0, "learning_rate": 4.5764420771170735e-06, "epoch": 0.8073394495412844, "percentage": 26.96, "elapsed_time": "0:36:32", "remaining_time": "1:38:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 112, "total_steps": 408, "loss": 0.6247, "accuracy": 1.0, "learning_rate": 4.552302893252166e-06, "epoch": 0.8220183486238533, "percentage": 27.45, "elapsed_time": "0:37:18", "remaining_time": "1:38:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 114, "total_steps": 408, "loss": 0.622, "accuracy": 1.0, "learning_rate": 4.52756217777234e-06, "epoch": 0.8366972477064221, "percentage": 27.94, "elapsed_time": "0:37:57", "remaining_time": "1:37:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 116, "total_steps": 408, "loss": 0.6151, "accuracy": 1.0, "learning_rate": 4.502227182201035e-06, "epoch": 0.8513761467889909, "percentage": 28.43, "elapsed_time": "0:38:31", "remaining_time": "1:36:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 118, "total_steps": 408, "loss": 0.6114, "accuracy": 0.984375, "learning_rate": 4.476305332245662e-06, "epoch": 0.8660550458715597, "percentage": 28.92, "elapsed_time": "0:39:21", "remaining_time": "1:36:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 120, "total_steps": 408, "loss": 0.6166, "accuracy": 0.984375, "learning_rate": 4.449804225621116e-06, "epoch": 0.8807339449541285, "percentage": 29.41, "elapsed_time": "0:39:56", "remaining_time": "1:35:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 122, "total_steps": 408, "loss": 0.6105, "accuracy": 0.984375, "learning_rate": 4.422731629822887e-06, "epoch": 0.8954128440366973, "percentage": 29.9, "elapsed_time": "0:40:37", "remaining_time": "1:35:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 124, "total_steps": 408, "loss": 0.6109, "accuracy": 0.96875, "learning_rate": 4.395095479850396e-06, "epoch": 0.9100917431192661, "percentage": 30.39, "elapsed_time": "0:41:08", "remaining_time": "1:34:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 126, "total_steps": 408, "loss": 0.6005, "accuracy": 1.0, "learning_rate": 4.366903875881243e-06, "epoch": 0.9247706422018349, "percentage": 30.88, "elapsed_time": "0:41:52", "remaining_time": "1:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 128, "total_steps": 408, "loss": 0.608, "accuracy": 0.984375, "learning_rate": 4.3381650808970365e-06, "epoch": 0.9394495412844037, "percentage": 31.37, "elapsed_time": "0:42:25", "remaining_time": "1:32:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 130, "total_steps": 408, "loss": 0.6011, "accuracy": 1.0, "learning_rate": 4.308887518261507e-06, "epoch": 0.9541284403669725, "percentage": 31.86, "elapsed_time": "0:43:01", "remaining_time": "1:32:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 132, "total_steps": 408, "loss": 0.596, "accuracy": 0.984375, "learning_rate": 4.279079769251617e-06, "epoch": 0.9688073394495413, "percentage": 32.35, "elapsed_time": "0:43:47", "remaining_time": "1:31:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 134, "total_steps": 408, "loss": 0.5983, "accuracy": 1.0, "learning_rate": 4.248750570542373e-06, "epoch": 0.9834862385321101, "percentage": 32.84, "elapsed_time": "0:44:23", "remaining_time": "1:30:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 136, "total_steps": 408, "loss": 0.5837, "accuracy": 0.984375, "learning_rate": 4.21790881164611e-06, "epoch": 0.998165137614679, "percentage": 33.33, "elapsed_time": "0:44:59", "remaining_time": "1:29:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 138, "total_steps": 408, "loss": 0.5889, "accuracy": 1.0, "learning_rate": 4.186563532306957e-06, "epoch": 1.0128440366972478, "percentage": 33.82, "elapsed_time": "0:45:33", "remaining_time": "1:29:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 408, "loss": 0.5958, "accuracy": 1.0, "learning_rate": 4.154723919851291e-06, "epoch": 1.0275229357798166, "percentage": 34.31, "elapsed_time": "0:46:10", "remaining_time": "1:28:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 142, "total_steps": 408, "loss": 0.5867, "accuracy": 0.984375, "learning_rate": 4.122399306494918e-06, "epoch": 1.0422018348623854, "percentage": 34.8, "elapsed_time": "0:46:54", "remaining_time": "1:27:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 144, "total_steps": 408, "loss": 0.5708, "accuracy": 1.0, "learning_rate": 4.089599166607794e-06, "epoch": 1.0568807339449542, "percentage": 35.29, "elapsed_time": "0:47:30", "remaining_time": "1:27:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 146, "total_steps": 408, "loss": 0.5854, "accuracy": 1.0, "learning_rate": 4.05633311393708e-06, "epoch": 1.071559633027523, "percentage": 35.78, "elapsed_time": "0:48:11", "remaining_time": "1:26:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 148, "total_steps": 408, "loss": 0.5746, "accuracy": 0.984375, "learning_rate": 4.022610898789349e-06, "epoch": 1.0862385321100918, "percentage": 36.27, "elapsed_time": "0:48:43", "remaining_time": "1:25:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 408, "loss": 0.5678, "accuracy": 1.0, "learning_rate": 3.988442405172755e-06, "epoch": 1.1009174311926606, "percentage": 36.76, "elapsed_time": "0:49:25", "remaining_time": "1:25:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 152, "total_steps": 408, "loss": 0.5624, "accuracy": 1.0, "learning_rate": 3.953837647900031e-06, "epoch": 1.1155963302752294, "percentage": 37.25, "elapsed_time": "0:50:07", "remaining_time": "1:24:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 154, "total_steps": 408, "loss": 0.5681, "accuracy": 0.984375, "learning_rate": 3.918806769653135e-06, "epoch": 1.1302752293577982, "percentage": 37.75, "elapsed_time": "0:50:52", "remaining_time": "1:23:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 156, "total_steps": 408, "loss": 0.5765, "accuracy": 1.0, "learning_rate": 3.88336003801042e-06, "epoch": 1.144954128440367, "percentage": 38.24, "elapsed_time": "0:51:24", "remaining_time": "1:23:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 158, "total_steps": 408, "loss": 0.5538, "accuracy": 1.0, "learning_rate": 3.847507842437205e-06, "epoch": 1.1596330275229358, "percentage": 38.73, "elapsed_time": "0:51:58", "remaining_time": "1:22:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 160, "total_steps": 408, "loss": 0.5534, "accuracy": 1.0, "learning_rate": 3.811260691240604e-06, "epoch": 1.1743119266055047, "percentage": 39.22, "elapsed_time": "0:52:34", "remaining_time": "1:21:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 162, "total_steps": 408, "loss": 0.5679, "accuracy": 1.0, "learning_rate": 3.774629208489547e-06, "epoch": 1.1889908256880735, "percentage": 39.71, "elapsed_time": "0:53:06", "remaining_time": "1:20:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 164, "total_steps": 408, "loss": 0.5553, "accuracy": 1.0, "learning_rate": 3.7376241309008433e-06, "epoch": 1.2036697247706423, "percentage": 40.2, "elapsed_time": "0:53:44", "remaining_time": "1:19:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 166, "total_steps": 408, "loss": 0.5417, "accuracy": 1.0, "learning_rate": 3.7002563046922502e-06, "epoch": 1.218348623853211, "percentage": 40.69, "elapsed_time": "0:54:37", "remaining_time": "1:19:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 168, "total_steps": 408, "loss": 0.53, "accuracy": 1.0, "learning_rate": 3.6625366824034337e-06, "epoch": 1.2330275229357799, "percentage": 41.18, "elapsed_time": "0:55:17", "remaining_time": "1:18:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 170, "total_steps": 408, "loss": 0.5383, "accuracy": 1.0, "learning_rate": 3.6244763196857714e-06, "epoch": 1.2477064220183487, "percentage": 41.67, "elapsed_time": "0:56:03", "remaining_time": "1:18:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 172, "total_steps": 408, "loss": 0.5446, "accuracy": 1.0, "learning_rate": 3.5860863720619333e-06, "epoch": 1.2623853211009175, "percentage": 42.16, "elapsed_time": "0:56:50", "remaining_time": "1:17:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 174, "total_steps": 408, "loss": 0.5396, "accuracy": 1.0, "learning_rate": 3.547378091656186e-06, "epoch": 1.2770642201834863, "percentage": 42.65, "elapsed_time": "0:57:26", "remaining_time": "1:17:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 176, "total_steps": 408, "loss": 0.5512, "accuracy": 1.0, "learning_rate": 3.5083628238963913e-06, "epoch": 1.2917431192660551, "percentage": 43.14, "elapsed_time": "0:58:15", "remaining_time": "1:16:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 178, "total_steps": 408, "loss": 0.5392, "accuracy": 1.0, "learning_rate": 3.4690520041886473e-06, "epoch": 1.306422018348624, "percentage": 43.63, "elapsed_time": "0:58:57", "remaining_time": "1:16:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 180, "total_steps": 408, "loss": 0.5183, "accuracy": 1.0, "learning_rate": 3.4294571545655653e-06, "epoch": 1.3211009174311927, "percentage": 44.12, "elapsed_time": "0:59:39", "remaining_time": "1:15:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 182, "total_steps": 408, "loss": 0.5321, "accuracy": 0.96875, "learning_rate": 3.38958988030915e-06, "epoch": 1.3357798165137615, "percentage": 44.61, "elapsed_time": "1:00:27", "remaining_time": "1:15:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 184, "total_steps": 408, "loss": 0.5528, "accuracy": 1.0, "learning_rate": 3.3494618665492833e-06, "epoch": 1.3504587155963304, "percentage": 45.1, "elapsed_time": "1:01:05", "remaining_time": "1:14:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 186, "total_steps": 408, "loss": 0.515, "accuracy": 1.0, "learning_rate": 3.3090848748388042e-06, "epoch": 1.3651376146788992, "percentage": 45.59, "elapsed_time": "1:01:49", "remaining_time": "1:13:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 188, "total_steps": 408, "loss": 0.5302, "accuracy": 1.0, "learning_rate": 3.2684707397061887e-06, "epoch": 1.379816513761468, "percentage": 46.08, "elapsed_time": "1:02:46", "remaining_time": "1:13:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 190, "total_steps": 408, "loss": 0.5244, "accuracy": 1.0, "learning_rate": 3.2276313651868364e-06, "epoch": 1.3944954128440368, "percentage": 46.57, "elapsed_time": "1:03:20", "remaining_time": "1:12:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 192, "total_steps": 408, "loss": 0.5108, "accuracy": 1.0, "learning_rate": 3.1865787213339926e-06, "epoch": 1.4091743119266056, "percentage": 47.06, "elapsed_time": "1:03:55", "remaining_time": "1:11:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 194, "total_steps": 408, "loss": 0.5255, "accuracy": 1.0, "learning_rate": 3.1453248407103156e-06, "epoch": 1.4238532110091744, "percentage": 47.55, "elapsed_time": "1:04:33", "remaining_time": "1:11:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 196, "total_steps": 408, "loss": 0.5117, "accuracy": 1.0, "learning_rate": 3.1038818148611178e-06, "epoch": 1.4385321100917432, "percentage": 48.04, "elapsed_time": "1:05:06", "remaining_time": "1:10:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 198, "total_steps": 408, "loss": 0.5311, "accuracy": 0.984375, "learning_rate": 3.062261790770331e-06, "epoch": 1.453211009174312, "percentage": 48.53, "elapsed_time": "1:05:40", "remaining_time": "1:09:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 408, "loss": 0.5133, "accuracy": 1.0, "learning_rate": 3.0204769673002123e-06, "epoch": 1.4678899082568808, "percentage": 49.02, "elapsed_time": "1:06:15", "remaining_time": "1:08:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 202, "total_steps": 408, "loss": 0.5065, "accuracy": 0.984375, "learning_rate": 2.978539591615848e-06, "epoch": 1.4825688073394496, "percentage": 49.51, "elapsed_time": "1:06:47", "remaining_time": "1:08:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 204, "total_steps": 408, "loss": 0.5078, "accuracy": 1.0, "learning_rate": 2.936461955595501e-06, "epoch": 1.4972477064220184, "percentage": 50.0, "elapsed_time": "1:07:20", "remaining_time": "1:07:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 206, "total_steps": 408, "loss": 0.4952, "accuracy": 1.0, "learning_rate": 2.8942563922278487e-06, "epoch": 1.5119266055045872, "percentage": 50.49, "elapsed_time": "1:07:57", "remaining_time": "1:06:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 208, "total_steps": 408, "loss": 0.5053, "accuracy": 1.0, "learning_rate": 2.8519352719971783e-06, "epoch": 1.526605504587156, "percentage": 50.98, "elapsed_time": "1:08:43", "remaining_time": "1:06:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 408, "loss": 0.4931, "accuracy": 1.0, "learning_rate": 2.8095109992575824e-06, "epoch": 1.5412844036697249, "percentage": 51.47, "elapsed_time": "1:09:27", "remaining_time": "1:05:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 212, "total_steps": 408, "loss": 0.496, "accuracy": 1.0, "learning_rate": 2.7669960085972407e-06, "epoch": 1.5559633027522937, "percentage": 51.96, "elapsed_time": "1:10:09", "remaining_time": "1:04:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 214, "total_steps": 408, "loss": 0.4979, "accuracy": 1.0, "learning_rate": 2.7244027611938247e-06, "epoch": 1.5706422018348625, "percentage": 52.45, "elapsed_time": "1:10:44", "remaining_time": "1:04:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 216, "total_steps": 408, "loss": 0.5008, "accuracy": 0.984375, "learning_rate": 2.6817437411621194e-06, "epoch": 1.5853211009174313, "percentage": 52.94, "elapsed_time": "1:11:25", "remaining_time": "1:03:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 218, "total_steps": 408, "loss": 0.4828, "accuracy": 1.0, "learning_rate": 2.639031451894923e-06, "epoch": 1.6, "percentage": 53.43, "elapsed_time": "1:12:17", "remaining_time": "1:03:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 220, "total_steps": 408, "loss": 0.4815, "accuracy": 1.0, "learning_rate": 2.5962784123982843e-06, "epoch": 1.614678899082569, "percentage": 53.92, "elapsed_time": "1:12:58", "remaining_time": "1:02:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 222, "total_steps": 408, "loss": 0.4908, "accuracy": 1.0, "learning_rate": 2.5534971536221804e-06, "epoch": 1.6293577981651377, "percentage": 54.41, "elapsed_time": "1:13:36", "remaining_time": "1:01:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 224, "total_steps": 408, "loss": 0.4773, "accuracy": 1.0, "learning_rate": 2.5107002147876814e-06, "epoch": 1.6440366972477065, "percentage": 54.9, "elapsed_time": "1:14:11", "remaining_time": "1:00:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 226, "total_steps": 408, "loss": 0.4953, "accuracy": 0.984375, "learning_rate": 2.467900139711693e-06, "epoch": 1.6587155963302753, "percentage": 55.39, "elapsed_time": "1:14:50", "remaining_time": "1:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 228, "total_steps": 408, "loss": 0.478, "accuracy": 1.0, "learning_rate": 2.4251094731303586e-06, "epoch": 1.6733944954128441, "percentage": 55.88, "elapsed_time": "1:15:36", "remaining_time": "0:59:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 230, "total_steps": 408, "loss": 0.4758, "accuracy": 1.0, "learning_rate": 2.3823407570221812e-06, "epoch": 1.688073394495413, "percentage": 56.37, "elapsed_time": "1:16:10", "remaining_time": "0:58:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 232, "total_steps": 408, "loss": 0.4719, "accuracy": 1.0, "learning_rate": 2.3396065269319655e-06, "epoch": 1.7027522935779817, "percentage": 56.86, "elapsed_time": "1:16:45", "remaining_time": "0:58:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 234, "total_steps": 408, "loss": 0.4571, "accuracy": 1.0, "learning_rate": 2.2969193082966353e-06, "epoch": 1.7174311926605506, "percentage": 57.35, "elapsed_time": "1:17:18", "remaining_time": "0:57:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 236, "total_steps": 408, "loss": 0.4653, "accuracy": 1.0, "learning_rate": 2.2542916127740194e-06, "epoch": 1.7321100917431194, "percentage": 57.84, "elapsed_time": "1:17:56", "remaining_time": "0:56:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 238, "total_steps": 408, "loss": 0.4837, "accuracy": 1.0, "learning_rate": 2.211735934575674e-06, "epoch": 1.7467889908256882, "percentage": 58.33, "elapsed_time": "1:18:34", "remaining_time": "0:56:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 240, "total_steps": 408, "loss": 0.4323, "accuracy": 1.0, "learning_rate": 2.1692647468048235e-06, "epoch": 1.761467889908257, "percentage": 58.82, "elapsed_time": "1:19:09", "remaining_time": "0:55:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 242, "total_steps": 408, "loss": 0.4772, "accuracy": 1.0, "learning_rate": 2.126890497800477e-06, "epoch": 1.7761467889908258, "percentage": 59.31, "elapsed_time": "1:19:44", "remaining_time": "0:54:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 244, "total_steps": 408, "loss": 0.4475, "accuracy": 1.0, "learning_rate": 2.084625607488816e-06, "epoch": 1.7908256880733946, "percentage": 59.8, "elapsed_time": "1:20:22", "remaining_time": "0:54:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 246, "total_steps": 408, "loss": 0.4525, "accuracy": 1.0, "learning_rate": 2.0424824637428995e-06, "epoch": 1.8055045871559634, "percentage": 60.29, "elapsed_time": "1:20:59", "remaining_time": "0:53:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 248, "total_steps": 408, "loss": 0.4711, "accuracy": 1.0, "learning_rate": 2.0004734187517744e-06, "epoch": 1.8201834862385322, "percentage": 60.78, "elapsed_time": "1:21:52", "remaining_time": "0:52:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 408, "loss": 0.4587, "accuracy": 0.984375, "learning_rate": 1.9586107854000327e-06, "epoch": 1.834862385321101, "percentage": 61.27, "elapsed_time": "1:22:43", "remaining_time": "0:52:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 252, "total_steps": 408, "loss": 0.4397, "accuracy": 1.0, "learning_rate": 1.916906833658899e-06, "epoch": 1.8495412844036698, "percentage": 61.76, "elapsed_time": "1:23:16", "remaining_time": "0:51:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 254, "total_steps": 408, "loss": 0.4282, "accuracy": 1.0, "learning_rate": 1.8753737869898921e-06, "epoch": 1.8642201834862386, "percentage": 62.25, "elapsed_time": "1:23:56", "remaining_time": "0:50:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 256, "total_steps": 408, "loss": 0.4631, "accuracy": 0.984375, "learning_rate": 1.8340238187621185e-06, "epoch": 1.8788990825688074, "percentage": 62.75, "elapsed_time": "1:24:31", "remaining_time": "0:50:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 258, "total_steps": 408, "loss": 0.4476, "accuracy": 1.0, "learning_rate": 1.7928690486842438e-06, "epoch": 1.8935779816513763, "percentage": 63.24, "elapsed_time": "1:25:12", "remaining_time": "0:49:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 260, "total_steps": 408, "loss": 0.4325, "accuracy": 0.984375, "learning_rate": 1.7519215392522026e-06, "epoch": 1.908256880733945, "percentage": 63.73, "elapsed_time": "1:25:52", "remaining_time": "0:48:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 262, "total_steps": 408, "loss": 0.4334, "accuracy": 1.0, "learning_rate": 1.7111932922136715e-06, "epoch": 1.9229357798165139, "percentage": 64.22, "elapsed_time": "1:26:27", "remaining_time": "0:48:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 264, "total_steps": 408, "loss": 0.4097, "accuracy": 1.0, "learning_rate": 1.6706962450503408e-06, "epoch": 1.9376146788990827, "percentage": 64.71, "elapsed_time": "1:27:03", "remaining_time": "0:47:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 266, "total_steps": 408, "loss": 0.4194, "accuracy": 1.0, "learning_rate": 1.630442267479034e-06, "epoch": 1.9522935779816515, "percentage": 65.2, "elapsed_time": "1:27:44", "remaining_time": "0:46:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 268, "total_steps": 408, "loss": 0.4249, "accuracy": 1.0, "learning_rate": 1.5904431579726837e-06, "epoch": 1.9669724770642203, "percentage": 65.69, "elapsed_time": "1:28:20", "remaining_time": "0:46:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 270, "total_steps": 408, "loss": 0.409, "accuracy": 1.0, "learning_rate": 1.5507106403021897e-06, "epoch": 1.981651376146789, "percentage": 66.18, "elapsed_time": "1:28:59", "remaining_time": "0:45:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 272, "total_steps": 408, "loss": 0.4173, "accuracy": 1.0, "learning_rate": 1.511256360100171e-06, "epoch": 1.996330275229358, "percentage": 66.67, "elapsed_time": "1:29:33", "remaining_time": "0:44:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 274, "total_steps": 408, "loss": 0.4012, "accuracy": 1.0, "learning_rate": 1.4720918814476234e-06, "epoch": 2.0110091743119267, "percentage": 67.16, "elapsed_time": "1:30:17", "remaining_time": "0:44:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 276, "total_steps": 408, "loss": 0.4338, "accuracy": 0.984375, "learning_rate": 1.4332286834844792e-06, "epoch": 2.0256880733944955, "percentage": 67.65, "elapsed_time": "1:31:07", "remaining_time": "0:43:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 278, "total_steps": 408, "loss": 0.4167, "accuracy": 1.0, "learning_rate": 1.3946781570450563e-06, "epoch": 2.0403669724770643, "percentage": 68.14, "elapsed_time": "1:31:51", "remaining_time": "0:42:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 408, "loss": 0.3969, "accuracy": 1.0, "learning_rate": 1.3564516013194023e-06, "epoch": 2.055045871559633, "percentage": 68.63, "elapsed_time": "1:32:22", "remaining_time": "0:42:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 282, "total_steps": 408, "loss": 0.4159, "accuracy": 1.0, "learning_rate": 1.3185602205414894e-06, "epoch": 2.069724770642202, "percentage": 69.12, "elapsed_time": "1:33:04", "remaining_time": "0:41:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 284, "total_steps": 408, "loss": 0.4115, "accuracy": 1.0, "learning_rate": 1.2810151207052465e-06, "epoch": 2.0844036697247708, "percentage": 69.61, "elapsed_time": "1:33:58", "remaining_time": "0:41:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 286, "total_steps": 408, "loss": 0.4249, "accuracy": 0.96875, "learning_rate": 1.2438273063093811e-06, "epoch": 2.0990825688073396, "percentage": 70.1, "elapsed_time": "1:34:30", "remaining_time": "0:40:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 288, "total_steps": 408, "loss": 0.4411, "accuracy": 0.984375, "learning_rate": 1.2070076771319536e-06, "epoch": 2.1137614678899084, "percentage": 70.59, "elapsed_time": "1:35:21", "remaining_time": "0:39:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 290, "total_steps": 408, "loss": 0.3927, "accuracy": 1.0, "learning_rate": 1.1705670250356417e-06, "epoch": 2.128440366972477, "percentage": 71.08, "elapsed_time": "1:35:59", "remaining_time": "0:39:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 292, "total_steps": 408, "loss": 0.3851, "accuracy": 0.984375, "learning_rate": 1.1345160308046413e-06, "epoch": 2.143119266055046, "percentage": 71.57, "elapsed_time": "1:36:40", "remaining_time": "0:38:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 294, "total_steps": 408, "loss": 0.4036, "accuracy": 1.0, "learning_rate": 1.0988652610141154e-06, "epoch": 2.157798165137615, "percentage": 72.06, "elapsed_time": "1:37:13", "remaining_time": "0:37:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 296, "total_steps": 408, "loss": 0.3531, "accuracy": 0.96875, "learning_rate": 1.063625164933124e-06, "epoch": 2.1724770642201836, "percentage": 72.55, "elapsed_time": "1:37:51", "remaining_time": "0:37:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 298, "total_steps": 408, "loss": 0.3905, "accuracy": 0.984375, "learning_rate": 1.0288060714619359e-06, "epoch": 2.1871559633027524, "percentage": 73.04, "elapsed_time": "1:38:35", "remaining_time": "0:36:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 408, "loss": 0.3944, "accuracy": 0.953125, "learning_rate": 9.944181861046188e-07, "epoch": 2.2018348623853212, "percentage": 73.53, "elapsed_time": "1:39:11", "remaining_time": "0:35:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 302, "total_steps": 408, "loss": 0.3973, "accuracy": 0.984375, "learning_rate": 9.604715879777986e-07, "epoch": 2.21651376146789, "percentage": 74.02, "elapsed_time": "1:39:46", "remaining_time": "0:35:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 304, "total_steps": 408, "loss": 0.4002, "accuracy": 1.0, "learning_rate": 9.269762268564616e-07, "epoch": 2.231192660550459, "percentage": 74.51, "elapsed_time": "1:40:30", "remaining_time": "0:34:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 306, "total_steps": 408, "loss": 0.4307, "accuracy": 0.984375, "learning_rate": 8.939419202576694e-07, "epoch": 2.2458715596330276, "percentage": 75.0, "elapsed_time": "1:41:00", "remaining_time": "0:33:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 308, "total_steps": 408, "loss": 0.3881, "accuracy": 1.0, "learning_rate": 8.61378350563033e-07, "epoch": 2.2605504587155965, "percentage": 75.49, "elapsed_time": "1:41:32", "remaining_time": "0:32:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 310, "total_steps": 408, "loss": 0.3722, "accuracy": 1.0, "learning_rate": 8.292950621808022e-07, "epoch": 2.2752293577981653, "percentage": 75.98, "elapsed_time": "1:42:06", "remaining_time": "0:32:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 312, "total_steps": 408, "loss": 0.3736, "accuracy": 0.96875, "learning_rate": 7.977014587483925e-07, "epoch": 2.289908256880734, "percentage": 76.47, "elapsed_time": "1:42:57", "remaining_time": "0:31:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 314, "total_steps": 408, "loss": 0.3822, "accuracy": 0.96875, "learning_rate": 7.666068003761684e-07, "epoch": 2.304587155963303, "percentage": 76.96, "elapsed_time": "1:43:35", "remaining_time": "0:31:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 316, "total_steps": 408, "loss": 0.3766, "accuracy": 0.984375, "learning_rate": 7.360202009332993e-07, "epoch": 2.3192660550458717, "percentage": 77.45, "elapsed_time": "1:44:14", "remaining_time": "0:30:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 318, "total_steps": 408, "loss": 0.3588, "accuracy": 0.984375, "learning_rate": 7.059506253764773e-07, "epoch": 2.3339449541284405, "percentage": 77.94, "elapsed_time": "1:44:53", "remaining_time": "0:29:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 320, "total_steps": 408, "loss": 0.3804, "accuracy": 0.984375, "learning_rate": 6.764068871222825e-07, "epoch": 2.3486238532110093, "percentage": 78.43, "elapsed_time": "1:45:32", "remaining_time": "0:29:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 322, "total_steps": 408, "loss": 0.3688, "accuracy": 1.0, "learning_rate": 6.473976454639608e-07, "epoch": 2.363302752293578, "percentage": 78.92, "elapsed_time": "1:46:07", "remaining_time": "0:28:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 324, "total_steps": 408, "loss": 0.3605, "accuracy": 0.984375, "learning_rate": 6.189314030333796e-07, "epoch": 2.377981651376147, "percentage": 79.41, "elapsed_time": "1:46:44", "remaining_time": "0:27:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 326, "total_steps": 408, "loss": 0.3747, "accuracy": 0.984375, "learning_rate": 5.910165033089e-07, "epoch": 2.3926605504587157, "percentage": 79.9, "elapsed_time": "1:47:23", "remaining_time": "0:27:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 328, "total_steps": 408, "loss": 0.3875, "accuracy": 1.0, "learning_rate": 5.636611281698956e-07, "epoch": 2.4073394495412845, "percentage": 80.39, "elapsed_time": "1:48:02", "remaining_time": "0:26:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 330, "total_steps": 408, "loss": 0.3811, "accuracy": 1.0, "learning_rate": 5.368732954986389e-07, "epoch": 2.4220183486238533, "percentage": 80.88, "elapsed_time": "1:48:56", "remaining_time": "0:25:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 332, "total_steps": 408, "loss": 0.3586, "accuracy": 0.984375, "learning_rate": 5.106608568302504e-07, "epoch": 2.436697247706422, "percentage": 81.37, "elapsed_time": "1:49:39", "remaining_time": "0:25:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 334, "total_steps": 408, "loss": 0.361, "accuracy": 0.984375, "learning_rate": 4.850314950514124e-07, "epoch": 2.451376146788991, "percentage": 81.86, "elapsed_time": "1:50:10", "remaining_time": "0:24:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 336, "total_steps": 408, "loss": 0.383, "accuracy": 0.984375, "learning_rate": 4.599927221485034e-07, "epoch": 2.4660550458715598, "percentage": 82.35, "elapsed_time": "1:50:50", "remaining_time": "0:23:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 338, "total_steps": 408, "loss": 0.3509, "accuracy": 1.0, "learning_rate": 4.3555187700583175e-07, "epoch": 2.4807339449541286, "percentage": 82.84, "elapsed_time": "1:51:30", "remaining_time": "0:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 340, "total_steps": 408, "loss": 0.3873, "accuracy": 0.984375, "learning_rate": 4.1171612325460244e-07, "epoch": 2.4954128440366974, "percentage": 83.33, "elapsed_time": "1:52:11", "remaining_time": "0:22:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 342, "total_steps": 408, "loss": 0.3455, "accuracy": 0.984375, "learning_rate": 3.8849244717325206e-07, "epoch": 2.510091743119266, "percentage": 83.82, "elapsed_time": "1:52:50", "remaining_time": "0:21:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 344, "total_steps": 408, "loss": 0.379, "accuracy": 0.96875, "learning_rate": 3.658876556397628e-07, "epoch": 2.524770642201835, "percentage": 84.31, "elapsed_time": "1:53:32", "remaining_time": "0:21:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 346, "total_steps": 408, "loss": 0.3594, "accuracy": 1.0, "learning_rate": 3.4390837413656256e-07, "epoch": 2.539449541284404, "percentage": 84.8, "elapsed_time": "1:54:13", "remaining_time": "0:20:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 348, "total_steps": 408, "loss": 0.3636, "accuracy": 0.96875, "learning_rate": 3.225610448085903e-07, "epoch": 2.5541284403669726, "percentage": 85.29, "elapsed_time": "1:54:49", "remaining_time": "0:19:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 408, "loss": 0.366, "accuracy": 0.984375, "learning_rate": 3.018519245750989e-07, "epoch": 2.5688073394495414, "percentage": 85.78, "elapsed_time": "1:55:25", "remaining_time": "0:19:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 352, "total_steps": 408, "loss": 0.3691, "accuracy": 0.984375, "learning_rate": 2.817870832957459e-07, "epoch": 2.5834862385321102, "percentage": 86.27, "elapsed_time": "1:55:55", "remaining_time": "0:18:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 354, "total_steps": 408, "loss": 0.3916, "accuracy": 0.9375, "learning_rate": 2.6237240199151386e-07, "epoch": 2.598165137614679, "percentage": 86.76, "elapsed_time": "1:56:41", "remaining_time": "0:17:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 356, "total_steps": 408, "loss": 0.3934, "accuracy": 1.0, "learning_rate": 2.436135711209786e-07, "epoch": 2.612844036697248, "percentage": 87.25, "elapsed_time": "1:57:29", "remaining_time": "0:17:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 358, "total_steps": 408, "loss": 0.3921, "accuracy": 0.984375, "learning_rate": 2.2551608891243026e-07, "epoch": 2.6275229357798167, "percentage": 87.75, "elapsed_time": "1:58:13", "remaining_time": "0:16:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 360, "total_steps": 408, "loss": 0.373, "accuracy": 1.0, "learning_rate": 2.0808525975233807e-07, "epoch": 2.6422018348623855, "percentage": 88.24, "elapsed_time": "1:58:47", "remaining_time": "0:15:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 362, "total_steps": 408, "loss": 0.3499, "accuracy": 0.984375, "learning_rate": 1.9132619263063144e-07, "epoch": 2.6568807339449543, "percentage": 88.73, "elapsed_time": "1:59:32", "remaining_time": "0:15:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 364, "total_steps": 408, "loss": 0.3701, "accuracy": 0.984375, "learning_rate": 1.7524379964325155e-07, "epoch": 2.671559633027523, "percentage": 89.22, "elapsed_time": "2:00:12", "remaining_time": "0:14:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 366, "total_steps": 408, "loss": 0.3558, "accuracy": 1.0, "learning_rate": 1.5984279455240975e-07, "epoch": 2.686238532110092, "percentage": 89.71, "elapsed_time": "2:00:51", "remaining_time": "0:13:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 368, "total_steps": 408, "loss": 0.365, "accuracy": 1.0, "learning_rate": 1.451276914049818e-07, "epoch": 2.7009174311926607, "percentage": 90.2, "elapsed_time": "2:01:29", "remaining_time": "0:13:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 370, "total_steps": 408, "loss": 0.3549, "accuracy": 0.96875, "learning_rate": 1.3110280320943692e-07, "epoch": 2.7155963302752295, "percentage": 90.69, "elapsed_time": "2:02:05", "remaining_time": "0:12:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 372, "total_steps": 408, "loss": 0.3445, "accuracy": 0.984375, "learning_rate": 1.1777224067169218e-07, "epoch": 2.7302752293577983, "percentage": 91.18, "elapsed_time": "2:02:45", "remaining_time": "0:11:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 374, "total_steps": 408, "loss": 0.3888, "accuracy": 0.984375, "learning_rate": 1.0513991099025872e-07, "epoch": 2.744954128440367, "percentage": 91.67, "elapsed_time": "2:03:30", "remaining_time": "0:11:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 376, "total_steps": 408, "loss": 0.3629, "accuracy": 0.984375, "learning_rate": 9.320951671104194e-08, "epoch": 2.759633027522936, "percentage": 92.16, "elapsed_time": "2:04:12", "remaining_time": "0:10:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 378, "total_steps": 408, "loss": 0.3533, "accuracy": 0.984375, "learning_rate": 8.198455464212108e-08, "epoch": 2.7743119266055047, "percentage": 92.65, "elapsed_time": "2:04:50", "remaining_time": "0:09:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 380, "total_steps": 408, "loss": 0.34, "accuracy": 0.984375, "learning_rate": 7.146831482883115e-08, "epoch": 2.7889908256880735, "percentage": 93.14, "elapsed_time": "2:05:22", "remaining_time": "0:09:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 382, "total_steps": 408, "loss": 0.3668, "accuracy": 0.96875, "learning_rate": 6.16638795894492e-08, "epoch": 2.8036697247706424, "percentage": 93.63, "elapsed_time": "2:05:55", "remaining_time": "0:08:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 384, "total_steps": 408, "loss": 0.3605, "accuracy": 1.0, "learning_rate": 5.257412261176375e-08, "epoch": 2.818348623853211, "percentage": 94.12, "elapsed_time": "2:06:41", "remaining_time": "0:07:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 386, "total_steps": 408, "loss": 0.3729, "accuracy": 0.984375, "learning_rate": 4.4201708110795384e-08, "epoch": 2.83302752293578, "percentage": 94.61, "elapsed_time": "2:07:16", "remaining_time": "0:07:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 388, "total_steps": 408, "loss": 0.3548, "accuracy": 0.984375, "learning_rate": 3.654909004791152e-08, "epoch": 2.847706422018349, "percentage": 95.1, "elapsed_time": "2:07:58", "remaining_time": "0:06:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 390, "total_steps": 408, "loss": 0.3783, "accuracy": 0.953125, "learning_rate": 2.9618511411570462e-08, "epoch": 2.8623853211009176, "percentage": 95.59, "elapsed_time": "2:08:29", "remaining_time": "0:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 392, "total_steps": 408, "loss": 0.3728, "accuracy": 0.984375, "learning_rate": 2.3412003559898088e-08, "epoch": 2.8770642201834864, "percentage": 96.08, "elapsed_time": "2:09:05", "remaining_time": "0:05:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 394, "total_steps": 408, "loss": 0.375, "accuracy": 0.984375, "learning_rate": 1.793138562529634e-08, "epoch": 2.891743119266055, "percentage": 96.57, "elapsed_time": "2:09:51", "remaining_time": "0:04:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 396, "total_steps": 408, "loss": 0.3385, "accuracy": 0.96875, "learning_rate": 1.317826398125277e-08, "epoch": 2.906422018348624, "percentage": 97.06, "elapsed_time": "2:10:47", "remaining_time": "0:03:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 398, "total_steps": 408, "loss": 0.3416, "accuracy": 1.0, "learning_rate": 9.15403177151275e-09, "epoch": 2.921100917431193, "percentage": 97.55, "elapsed_time": "2:11:29", "remaining_time": "0:03:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 400, "total_steps": 408, "loss": 0.3473, "accuracy": 0.984375, "learning_rate": 5.85986850174608e-09, "epoch": 2.9357798165137616, "percentage": 98.04, "elapsed_time": "2:12:02", "remaining_time": "0:02:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 402, "total_steps": 408, "loss": 0.4044, "accuracy": 0.9375, "learning_rate": 3.296739693834927e-09, "epoch": 2.9504587155963304, "percentage": 98.53, "elapsed_time": "2:12:38", "remaining_time": "0:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 404, "total_steps": 408, "loss": 0.3315, "accuracy": 0.984375, "learning_rate": 1.4653966028774225e-09, "epoch": 2.9651376146788992, "percentage": 99.02, "elapsed_time": "2:13:11", "remaining_time": "0:01:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 406, "total_steps": 408, "loss": 0.3713, "accuracy": 1.0, "learning_rate": 3.6637599699351766e-10, "epoch": 2.979816513761468, "percentage": 99.51, "elapsed_time": "2:13:52", "remaining_time": "0:00:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 408, "total_steps": 408, "loss": 0.355, "accuracy": 0.984375, "learning_rate": 0.0, "epoch": 2.994495412844037, "percentage": 100.0, "elapsed_time": "2:14:33", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 408, "total_steps": 408, "epoch": 2.994495412844037, "percentage": 100.0, "elapsed_time": "2:14:33", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}