File size: 52,062 Bytes
a8aec59 4f7f79e |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 |
{"current_steps": 10, "total_steps": 2724, "loss": 0.7005, "learning_rate": 5e-06, "epoch": 0.01100715465052284, "percentage": 0.37, "elapsed_time": "0:01:32", "remaining_time": "6:58:19"}
{"current_steps": 20, "total_steps": 2724, "loss": 0.6377, "learning_rate": 5e-06, "epoch": 0.02201430930104568, "percentage": 0.73, "elapsed_time": "0:02:56", "remaining_time": "6:36:35"}
{"current_steps": 30, "total_steps": 2724, "loss": 0.6063, "learning_rate": 5e-06, "epoch": 0.03302146395156852, "percentage": 1.1, "elapsed_time": "0:04:19", "remaining_time": "6:28:02"}
{"current_steps": 40, "total_steps": 2724, "loss": 0.5969, "learning_rate": 5e-06, "epoch": 0.04402861860209136, "percentage": 1.47, "elapsed_time": "0:05:42", "remaining_time": "6:22:59"}
{"current_steps": 50, "total_steps": 2724, "loss": 0.5714, "learning_rate": 5e-06, "epoch": 0.0550357732526142, "percentage": 1.84, "elapsed_time": "0:07:05", "remaining_time": "6:19:29"}
{"current_steps": 60, "total_steps": 2724, "loss": 0.5648, "learning_rate": 5e-06, "epoch": 0.06604292790313704, "percentage": 2.2, "elapsed_time": "0:08:29", "remaining_time": "6:16:51"}
{"current_steps": 70, "total_steps": 2724, "loss": 0.5611, "learning_rate": 5e-06, "epoch": 0.07705008255365987, "percentage": 2.57, "elapsed_time": "0:09:52", "remaining_time": "6:14:27"}
{"current_steps": 80, "total_steps": 2724, "loss": 0.5512, "learning_rate": 5e-06, "epoch": 0.08805723720418272, "percentage": 2.94, "elapsed_time": "0:11:16", "remaining_time": "6:12:22"}
{"current_steps": 90, "total_steps": 2724, "loss": 0.5485, "learning_rate": 5e-06, "epoch": 0.09906439185470556, "percentage": 3.3, "elapsed_time": "0:12:39", "remaining_time": "6:10:30"}
{"current_steps": 100, "total_steps": 2724, "loss": 0.5509, "learning_rate": 5e-06, "epoch": 0.1100715465052284, "percentage": 3.67, "elapsed_time": "0:14:03", "remaining_time": "6:08:44"}
{"current_steps": 110, "total_steps": 2724, "loss": 0.5408, "learning_rate": 5e-06, "epoch": 0.12107870115575124, "percentage": 4.04, "elapsed_time": "0:15:26", "remaining_time": "6:06:54"}
{"current_steps": 120, "total_steps": 2724, "loss": 0.5454, "learning_rate": 5e-06, "epoch": 0.13208585580627408, "percentage": 4.41, "elapsed_time": "0:16:49", "remaining_time": "6:05:11"}
{"current_steps": 130, "total_steps": 2724, "loss": 0.547, "learning_rate": 5e-06, "epoch": 0.14309301045679693, "percentage": 4.77, "elapsed_time": "0:18:13", "remaining_time": "6:03:33"}
{"current_steps": 140, "total_steps": 2724, "loss": 0.5355, "learning_rate": 5e-06, "epoch": 0.15410016510731975, "percentage": 5.14, "elapsed_time": "0:19:36", "remaining_time": "6:01:58"}
{"current_steps": 150, "total_steps": 2724, "loss": 0.5401, "learning_rate": 5e-06, "epoch": 0.1651073197578426, "percentage": 5.51, "elapsed_time": "0:21:00", "remaining_time": "6:00:21"}
{"current_steps": 160, "total_steps": 2724, "loss": 0.5382, "learning_rate": 5e-06, "epoch": 0.17611447440836545, "percentage": 5.87, "elapsed_time": "0:22:23", "remaining_time": "5:58:43"}
{"current_steps": 170, "total_steps": 2724, "loss": 0.5375, "learning_rate": 5e-06, "epoch": 0.18712162905888827, "percentage": 6.24, "elapsed_time": "0:23:45", "remaining_time": "5:57:02"}
{"current_steps": 180, "total_steps": 2724, "loss": 0.5293, "learning_rate": 5e-06, "epoch": 0.19812878370941112, "percentage": 6.61, "elapsed_time": "0:25:08", "remaining_time": "5:55:23"}
{"current_steps": 190, "total_steps": 2724, "loss": 0.529, "learning_rate": 5e-06, "epoch": 0.20913593835993396, "percentage": 6.98, "elapsed_time": "0:26:31", "remaining_time": "5:53:48"}
{"current_steps": 200, "total_steps": 2724, "loss": 0.5374, "learning_rate": 5e-06, "epoch": 0.2201430930104568, "percentage": 7.34, "elapsed_time": "0:27:55", "remaining_time": "5:52:19"}
{"current_steps": 210, "total_steps": 2724, "loss": 0.5244, "learning_rate": 5e-06, "epoch": 0.23115024766097964, "percentage": 7.71, "elapsed_time": "0:29:18", "remaining_time": "5:50:51"}
{"current_steps": 220, "total_steps": 2724, "loss": 0.5239, "learning_rate": 5e-06, "epoch": 0.24215740231150248, "percentage": 8.08, "elapsed_time": "0:30:42", "remaining_time": "5:49:27"}
{"current_steps": 230, "total_steps": 2724, "loss": 0.5208, "learning_rate": 5e-06, "epoch": 0.25316455696202533, "percentage": 8.44, "elapsed_time": "0:32:05", "remaining_time": "5:47:59"}
{"current_steps": 240, "total_steps": 2724, "loss": 0.5235, "learning_rate": 5e-06, "epoch": 0.26417171161254815, "percentage": 8.81, "elapsed_time": "0:33:28", "remaining_time": "5:46:30"}
{"current_steps": 250, "total_steps": 2724, "loss": 0.5208, "learning_rate": 5e-06, "epoch": 0.275178866263071, "percentage": 9.18, "elapsed_time": "0:34:52", "remaining_time": "5:45:04"}
{"current_steps": 260, "total_steps": 2724, "loss": 0.5221, "learning_rate": 5e-06, "epoch": 0.28618602091359385, "percentage": 9.54, "elapsed_time": "0:36:15", "remaining_time": "5:43:41"}
{"current_steps": 270, "total_steps": 2724, "loss": 0.5208, "learning_rate": 5e-06, "epoch": 0.2971931755641167, "percentage": 9.91, "elapsed_time": "0:37:39", "remaining_time": "5:42:15"}
{"current_steps": 280, "total_steps": 2724, "loss": 0.5197, "learning_rate": 5e-06, "epoch": 0.3082003302146395, "percentage": 10.28, "elapsed_time": "0:39:02", "remaining_time": "5:40:49"}
{"current_steps": 290, "total_steps": 2724, "loss": 0.5184, "learning_rate": 5e-06, "epoch": 0.31920748486516237, "percentage": 10.65, "elapsed_time": "0:40:26", "remaining_time": "5:39:23"}
{"current_steps": 300, "total_steps": 2724, "loss": 0.5212, "learning_rate": 5e-06, "epoch": 0.3302146395156852, "percentage": 11.01, "elapsed_time": "0:41:49", "remaining_time": "5:37:57"}
{"current_steps": 310, "total_steps": 2724, "loss": 0.5184, "learning_rate": 5e-06, "epoch": 0.341221794166208, "percentage": 11.38, "elapsed_time": "0:43:13", "remaining_time": "5:36:31"}
{"current_steps": 320, "total_steps": 2724, "loss": 0.5117, "learning_rate": 5e-06, "epoch": 0.3522289488167309, "percentage": 11.75, "elapsed_time": "0:44:36", "remaining_time": "5:35:06"}
{"current_steps": 330, "total_steps": 2724, "loss": 0.5168, "learning_rate": 5e-06, "epoch": 0.3632361034672537, "percentage": 12.11, "elapsed_time": "0:45:59", "remaining_time": "5:33:41"}
{"current_steps": 340, "total_steps": 2724, "loss": 0.5112, "learning_rate": 5e-06, "epoch": 0.37424325811777653, "percentage": 12.48, "elapsed_time": "0:47:23", "remaining_time": "5:32:16"}
{"current_steps": 350, "total_steps": 2724, "loss": 0.5093, "learning_rate": 5e-06, "epoch": 0.3852504127682994, "percentage": 12.85, "elapsed_time": "0:48:46", "remaining_time": "5:30:50"}
{"current_steps": 360, "total_steps": 2724, "loss": 0.5089, "learning_rate": 5e-06, "epoch": 0.39625756741882223, "percentage": 13.22, "elapsed_time": "0:50:10", "remaining_time": "5:29:25"}
{"current_steps": 370, "total_steps": 2724, "loss": 0.5119, "learning_rate": 5e-06, "epoch": 0.40726472206934505, "percentage": 13.58, "elapsed_time": "0:51:33", "remaining_time": "5:28:02"}
{"current_steps": 380, "total_steps": 2724, "loss": 0.5114, "learning_rate": 5e-06, "epoch": 0.41827187671986793, "percentage": 13.95, "elapsed_time": "0:52:57", "remaining_time": "5:26:39"}
{"current_steps": 390, "total_steps": 2724, "loss": 0.5099, "learning_rate": 5e-06, "epoch": 0.42927903137039075, "percentage": 14.32, "elapsed_time": "0:54:21", "remaining_time": "5:25:17"}
{"current_steps": 400, "total_steps": 2724, "loss": 0.5052, "learning_rate": 5e-06, "epoch": 0.4402861860209136, "percentage": 14.68, "elapsed_time": "0:55:45", "remaining_time": "5:23:57"}
{"current_steps": 410, "total_steps": 2724, "loss": 0.5101, "learning_rate": 5e-06, "epoch": 0.45129334067143645, "percentage": 15.05, "elapsed_time": "0:57:09", "remaining_time": "5:22:37"}
{"current_steps": 420, "total_steps": 2724, "loss": 0.5052, "learning_rate": 5e-06, "epoch": 0.46230049532195927, "percentage": 15.42, "elapsed_time": "0:58:34", "remaining_time": "5:21:17"}
{"current_steps": 430, "total_steps": 2724, "loss": 0.5071, "learning_rate": 5e-06, "epoch": 0.4733076499724821, "percentage": 15.79, "elapsed_time": "0:59:58", "remaining_time": "5:19:57"}
{"current_steps": 440, "total_steps": 2724, "loss": 0.5087, "learning_rate": 5e-06, "epoch": 0.48431480462300497, "percentage": 16.15, "elapsed_time": "1:01:22", "remaining_time": "5:18:36"}
{"current_steps": 450, "total_steps": 2724, "loss": 0.5037, "learning_rate": 5e-06, "epoch": 0.4953219592735278, "percentage": 16.52, "elapsed_time": "1:02:46", "remaining_time": "5:17:12"}
{"current_steps": 460, "total_steps": 2724, "loss": 0.5017, "learning_rate": 5e-06, "epoch": 0.5063291139240507, "percentage": 16.89, "elapsed_time": "1:04:09", "remaining_time": "5:15:46"}
{"current_steps": 470, "total_steps": 2724, "loss": 0.5027, "learning_rate": 5e-06, "epoch": 0.5173362685745735, "percentage": 17.25, "elapsed_time": "1:05:33", "remaining_time": "5:14:22"}
{"current_steps": 480, "total_steps": 2724, "loss": 0.4956, "learning_rate": 5e-06, "epoch": 0.5283434232250963, "percentage": 17.62, "elapsed_time": "1:06:57", "remaining_time": "5:13:00"}
{"current_steps": 490, "total_steps": 2724, "loss": 0.508, "learning_rate": 5e-06, "epoch": 0.5393505778756191, "percentage": 17.99, "elapsed_time": "1:08:21", "remaining_time": "5:11:37"}
{"current_steps": 500, "total_steps": 2724, "loss": 0.5055, "learning_rate": 5e-06, "epoch": 0.550357732526142, "percentage": 18.36, "elapsed_time": "1:09:44", "remaining_time": "5:10:13"}
{"current_steps": 510, "total_steps": 2724, "loss": 0.5039, "learning_rate": 5e-06, "epoch": 0.5613648871766649, "percentage": 18.72, "elapsed_time": "1:11:07", "remaining_time": "5:08:47"}
{"current_steps": 520, "total_steps": 2724, "loss": 0.4977, "learning_rate": 5e-06, "epoch": 0.5723720418271877, "percentage": 19.09, "elapsed_time": "1:12:31", "remaining_time": "5:07:22"}
{"current_steps": 530, "total_steps": 2724, "loss": 0.4998, "learning_rate": 5e-06, "epoch": 0.5833791964777105, "percentage": 19.46, "elapsed_time": "1:13:54", "remaining_time": "5:05:58"}
{"current_steps": 540, "total_steps": 2724, "loss": 0.5056, "learning_rate": 5e-06, "epoch": 0.5943863511282333, "percentage": 19.82, "elapsed_time": "1:15:18", "remaining_time": "5:04:36"}
{"current_steps": 550, "total_steps": 2724, "loss": 0.4987, "learning_rate": 5e-06, "epoch": 0.6053935057787562, "percentage": 20.19, "elapsed_time": "1:16:42", "remaining_time": "5:03:12"}
{"current_steps": 560, "total_steps": 2724, "loss": 0.501, "learning_rate": 5e-06, "epoch": 0.616400660429279, "percentage": 20.56, "elapsed_time": "1:18:06", "remaining_time": "5:01:50"}
{"current_steps": 570, "total_steps": 2724, "loss": 0.4962, "learning_rate": 5e-06, "epoch": 0.6274078150798019, "percentage": 20.93, "elapsed_time": "1:19:30", "remaining_time": "5:00:26"}
{"current_steps": 580, "total_steps": 2724, "loss": 0.4999, "learning_rate": 5e-06, "epoch": 0.6384149697303247, "percentage": 21.29, "elapsed_time": "1:20:53", "remaining_time": "4:59:02"}
{"current_steps": 590, "total_steps": 2724, "loss": 0.5039, "learning_rate": 5e-06, "epoch": 0.6494221243808476, "percentage": 21.66, "elapsed_time": "1:22:17", "remaining_time": "4:57:38"}
{"current_steps": 600, "total_steps": 2724, "loss": 0.4997, "learning_rate": 5e-06, "epoch": 0.6604292790313704, "percentage": 22.03, "elapsed_time": "1:23:40", "remaining_time": "4:56:14"}
{"current_steps": 610, "total_steps": 2724, "loss": 0.4953, "learning_rate": 5e-06, "epoch": 0.6714364336818932, "percentage": 22.39, "elapsed_time": "1:25:04", "remaining_time": "4:54:50"}
{"current_steps": 620, "total_steps": 2724, "loss": 0.492, "learning_rate": 5e-06, "epoch": 0.682443588332416, "percentage": 22.76, "elapsed_time": "1:26:27", "remaining_time": "4:53:25"}
{"current_steps": 630, "total_steps": 2724, "loss": 0.4953, "learning_rate": 5e-06, "epoch": 0.693450742982939, "percentage": 23.13, "elapsed_time": "1:27:51", "remaining_time": "4:52:00"}
{"current_steps": 640, "total_steps": 2724, "loss": 0.4889, "learning_rate": 5e-06, "epoch": 0.7044578976334618, "percentage": 23.49, "elapsed_time": "1:29:14", "remaining_time": "4:50:35"}
{"current_steps": 650, "total_steps": 2724, "loss": 0.5007, "learning_rate": 5e-06, "epoch": 0.7154650522839846, "percentage": 23.86, "elapsed_time": "1:30:37", "remaining_time": "4:49:10"}
{"current_steps": 660, "total_steps": 2724, "loss": 0.4938, "learning_rate": 5e-06, "epoch": 0.7264722069345074, "percentage": 24.23, "elapsed_time": "1:32:01", "remaining_time": "4:47:46"}
{"current_steps": 670, "total_steps": 2724, "loss": 0.4999, "learning_rate": 5e-06, "epoch": 0.7374793615850302, "percentage": 24.6, "elapsed_time": "1:33:24", "remaining_time": "4:46:22"}
{"current_steps": 680, "total_steps": 2724, "loss": 0.502, "learning_rate": 5e-06, "epoch": 0.7484865162355531, "percentage": 24.96, "elapsed_time": "1:34:48", "remaining_time": "4:44:59"}
{"current_steps": 690, "total_steps": 2724, "loss": 0.4967, "learning_rate": 5e-06, "epoch": 0.759493670886076, "percentage": 25.33, "elapsed_time": "1:36:13", "remaining_time": "4:43:38"}
{"current_steps": 700, "total_steps": 2724, "loss": 0.4927, "learning_rate": 5e-06, "epoch": 0.7705008255365988, "percentage": 25.7, "elapsed_time": "1:37:36", "remaining_time": "4:42:15"}
{"current_steps": 710, "total_steps": 2724, "loss": 0.4896, "learning_rate": 5e-06, "epoch": 0.7815079801871216, "percentage": 26.06, "elapsed_time": "1:39:00", "remaining_time": "4:40:51"}
{"current_steps": 720, "total_steps": 2724, "loss": 0.4897, "learning_rate": 5e-06, "epoch": 0.7925151348376445, "percentage": 26.43, "elapsed_time": "1:40:24", "remaining_time": "4:39:28"}
{"current_steps": 730, "total_steps": 2724, "loss": 0.488, "learning_rate": 5e-06, "epoch": 0.8035222894881673, "percentage": 26.8, "elapsed_time": "1:41:48", "remaining_time": "4:38:04"}
{"current_steps": 740, "total_steps": 2724, "loss": 0.4934, "learning_rate": 5e-06, "epoch": 0.8145294441386901, "percentage": 27.17, "elapsed_time": "1:43:12", "remaining_time": "4:36:42"}
{"current_steps": 750, "total_steps": 2724, "loss": 0.4892, "learning_rate": 5e-06, "epoch": 0.825536598789213, "percentage": 27.53, "elapsed_time": "1:44:36", "remaining_time": "4:35:19"}
{"current_steps": 760, "total_steps": 2724, "loss": 0.479, "learning_rate": 5e-06, "epoch": 0.8365437534397359, "percentage": 27.9, "elapsed_time": "1:46:00", "remaining_time": "4:33:56"}
{"current_steps": 770, "total_steps": 2724, "loss": 0.4918, "learning_rate": 5e-06, "epoch": 0.8475509080902587, "percentage": 28.27, "elapsed_time": "1:47:24", "remaining_time": "4:32:33"}
{"current_steps": 780, "total_steps": 2724, "loss": 0.4936, "learning_rate": 5e-06, "epoch": 0.8585580627407815, "percentage": 28.63, "elapsed_time": "1:48:48", "remaining_time": "4:31:10"}
{"current_steps": 790, "total_steps": 2724, "loss": 0.4912, "learning_rate": 5e-06, "epoch": 0.8695652173913043, "percentage": 29.0, "elapsed_time": "1:50:11", "remaining_time": "4:29:46"}
{"current_steps": 800, "total_steps": 2724, "loss": 0.4874, "learning_rate": 5e-06, "epoch": 0.8805723720418271, "percentage": 29.37, "elapsed_time": "1:51:35", "remaining_time": "4:28:23"}
{"current_steps": 810, "total_steps": 2724, "loss": 0.4898, "learning_rate": 5e-06, "epoch": 0.8915795266923501, "percentage": 29.74, "elapsed_time": "1:53:00", "remaining_time": "4:27:01"}
{"current_steps": 820, "total_steps": 2724, "loss": 0.4871, "learning_rate": 5e-06, "epoch": 0.9025866813428729, "percentage": 30.1, "elapsed_time": "1:54:24", "remaining_time": "4:25:38"}
{"current_steps": 830, "total_steps": 2724, "loss": 0.4874, "learning_rate": 5e-06, "epoch": 0.9135938359933957, "percentage": 30.47, "elapsed_time": "1:55:47", "remaining_time": "4:24:14"}
{"current_steps": 840, "total_steps": 2724, "loss": 0.4833, "learning_rate": 5e-06, "epoch": 0.9246009906439185, "percentage": 30.84, "elapsed_time": "1:57:11", "remaining_time": "4:22:49"}
{"current_steps": 850, "total_steps": 2724, "loss": 0.4854, "learning_rate": 5e-06, "epoch": 0.9356081452944414, "percentage": 31.2, "elapsed_time": "1:58:34", "remaining_time": "4:21:24"}
{"current_steps": 860, "total_steps": 2724, "loss": 0.4891, "learning_rate": 5e-06, "epoch": 0.9466152999449642, "percentage": 31.57, "elapsed_time": "1:59:57", "remaining_time": "4:20:00"}
{"current_steps": 870, "total_steps": 2724, "loss": 0.486, "learning_rate": 5e-06, "epoch": 0.9576224545954871, "percentage": 31.94, "elapsed_time": "2:01:20", "remaining_time": "4:18:35"}
{"current_steps": 880, "total_steps": 2724, "loss": 0.4865, "learning_rate": 5e-06, "epoch": 0.9686296092460099, "percentage": 32.31, "elapsed_time": "2:02:43", "remaining_time": "4:17:10"}
{"current_steps": 890, "total_steps": 2724, "loss": 0.487, "learning_rate": 5e-06, "epoch": 0.9796367638965328, "percentage": 32.67, "elapsed_time": "2:04:06", "remaining_time": "4:15:45"}
{"current_steps": 900, "total_steps": 2724, "loss": 0.4816, "learning_rate": 5e-06, "epoch": 0.9906439185470556, "percentage": 33.04, "elapsed_time": "2:05:30", "remaining_time": "4:14:21"}
{"current_steps": 908, "total_steps": 2724, "eval_loss": 0.4856513738632202, "epoch": 0.9994496422674739, "percentage": 33.33, "elapsed_time": "2:09:20", "remaining_time": "4:18:41"}
{"current_steps": 910, "total_steps": 2724, "loss": 0.481, "learning_rate": 5e-06, "epoch": 1.0016510731975785, "percentage": 33.41, "elapsed_time": "2:10:26", "remaining_time": "4:20:00"}
{"current_steps": 920, "total_steps": 2724, "loss": 0.4391, "learning_rate": 5e-06, "epoch": 1.0126582278481013, "percentage": 33.77, "elapsed_time": "2:11:48", "remaining_time": "4:18:28"}
{"current_steps": 930, "total_steps": 2724, "loss": 0.4375, "learning_rate": 5e-06, "epoch": 1.0236653824986242, "percentage": 34.14, "elapsed_time": "2:13:12", "remaining_time": "4:16:57"}
{"current_steps": 940, "total_steps": 2724, "loss": 0.4384, "learning_rate": 5e-06, "epoch": 1.034672537149147, "percentage": 34.51, "elapsed_time": "2:14:35", "remaining_time": "4:15:26"}
{"current_steps": 950, "total_steps": 2724, "loss": 0.4369, "learning_rate": 5e-06, "epoch": 1.0456796917996698, "percentage": 34.88, "elapsed_time": "2:15:58", "remaining_time": "4:13:55"}
{"current_steps": 960, "total_steps": 2724, "loss": 0.4355, "learning_rate": 5e-06, "epoch": 1.0566868464501926, "percentage": 35.24, "elapsed_time": "2:17:22", "remaining_time": "4:12:25"}
{"current_steps": 970, "total_steps": 2724, "loss": 0.4355, "learning_rate": 5e-06, "epoch": 1.0676940011007154, "percentage": 35.61, "elapsed_time": "2:18:45", "remaining_time": "4:10:55"}
{"current_steps": 980, "total_steps": 2724, "loss": 0.438, "learning_rate": 5e-06, "epoch": 1.0787011557512383, "percentage": 35.98, "elapsed_time": "2:20:09", "remaining_time": "4:09:25"}
{"current_steps": 990, "total_steps": 2724, "loss": 0.4382, "learning_rate": 5e-06, "epoch": 1.089708310401761, "percentage": 36.34, "elapsed_time": "2:21:32", "remaining_time": "4:07:55"}
{"current_steps": 1000, "total_steps": 2724, "loss": 0.4402, "learning_rate": 5e-06, "epoch": 1.100715465052284, "percentage": 36.71, "elapsed_time": "2:22:56", "remaining_time": "4:06:25"}
{"current_steps": 1010, "total_steps": 2724, "loss": 0.4369, "learning_rate": 5e-06, "epoch": 1.1117226197028067, "percentage": 37.08, "elapsed_time": "2:24:19", "remaining_time": "4:04:55"}
{"current_steps": 1020, "total_steps": 2724, "loss": 0.4343, "learning_rate": 5e-06, "epoch": 1.1227297743533298, "percentage": 37.44, "elapsed_time": "2:25:43", "remaining_time": "4:03:27"}
{"current_steps": 1030, "total_steps": 2724, "loss": 0.4407, "learning_rate": 5e-06, "epoch": 1.1337369290038526, "percentage": 37.81, "elapsed_time": "2:27:07", "remaining_time": "4:01:58"}
{"current_steps": 1040, "total_steps": 2724, "loss": 0.438, "learning_rate": 5e-06, "epoch": 1.1447440836543754, "percentage": 38.18, "elapsed_time": "2:28:31", "remaining_time": "4:00:30"}
{"current_steps": 1050, "total_steps": 2724, "loss": 0.4382, "learning_rate": 5e-06, "epoch": 1.1557512383048982, "percentage": 38.55, "elapsed_time": "2:29:55", "remaining_time": "3:59:00"}
{"current_steps": 1060, "total_steps": 2724, "loss": 0.442, "learning_rate": 5e-06, "epoch": 1.166758392955421, "percentage": 38.91, "elapsed_time": "2:31:18", "remaining_time": "3:57:31"}
{"current_steps": 1070, "total_steps": 2724, "loss": 0.4338, "learning_rate": 5e-06, "epoch": 1.1777655476059439, "percentage": 39.28, "elapsed_time": "2:32:41", "remaining_time": "3:56:02"}
{"current_steps": 1080, "total_steps": 2724, "loss": 0.435, "learning_rate": 5e-06, "epoch": 1.1887727022564667, "percentage": 39.65, "elapsed_time": "2:34:04", "remaining_time": "3:54:32"}
{"current_steps": 1090, "total_steps": 2724, "loss": 0.4422, "learning_rate": 5e-06, "epoch": 1.1997798569069895, "percentage": 40.01, "elapsed_time": "2:35:28", "remaining_time": "3:53:03"}
{"current_steps": 1100, "total_steps": 2724, "loss": 0.4372, "learning_rate": 5e-06, "epoch": 1.2107870115575123, "percentage": 40.38, "elapsed_time": "2:36:51", "remaining_time": "3:51:34"}
{"current_steps": 1110, "total_steps": 2724, "loss": 0.4321, "learning_rate": 5e-06, "epoch": 1.2217941662080352, "percentage": 40.75, "elapsed_time": "2:38:14", "remaining_time": "3:50:05"}
{"current_steps": 1120, "total_steps": 2724, "loss": 0.439, "learning_rate": 5e-06, "epoch": 1.232801320858558, "percentage": 41.12, "elapsed_time": "2:39:36", "remaining_time": "3:48:35"}
{"current_steps": 1130, "total_steps": 2724, "loss": 0.4391, "learning_rate": 5e-06, "epoch": 1.243808475509081, "percentage": 41.48, "elapsed_time": "2:41:00", "remaining_time": "3:47:06"}
{"current_steps": 1140, "total_steps": 2724, "loss": 0.4358, "learning_rate": 5e-06, "epoch": 1.2548156301596038, "percentage": 41.85, "elapsed_time": "2:42:23", "remaining_time": "3:45:38"}
{"current_steps": 1150, "total_steps": 2724, "loss": 0.4357, "learning_rate": 5e-06, "epoch": 1.2658227848101267, "percentage": 42.22, "elapsed_time": "2:43:46", "remaining_time": "3:44:09"}
{"current_steps": 1160, "total_steps": 2724, "loss": 0.4377, "learning_rate": 5e-06, "epoch": 1.2768299394606495, "percentage": 42.58, "elapsed_time": "2:45:10", "remaining_time": "3:42:41"}
{"current_steps": 1170, "total_steps": 2724, "loss": 0.4373, "learning_rate": 5e-06, "epoch": 1.2878370941111723, "percentage": 42.95, "elapsed_time": "2:46:33", "remaining_time": "3:41:13"}
{"current_steps": 1180, "total_steps": 2724, "loss": 0.4397, "learning_rate": 5e-06, "epoch": 1.2988442487616951, "percentage": 43.32, "elapsed_time": "2:47:56", "remaining_time": "3:39:45"}
{"current_steps": 1190, "total_steps": 2724, "loss": 0.4317, "learning_rate": 5e-06, "epoch": 1.309851403412218, "percentage": 43.69, "elapsed_time": "2:49:19", "remaining_time": "3:38:16"}
{"current_steps": 1200, "total_steps": 2724, "loss": 0.4388, "learning_rate": 5e-06, "epoch": 1.3208585580627408, "percentage": 44.05, "elapsed_time": "2:50:43", "remaining_time": "3:36:48"}
{"current_steps": 1210, "total_steps": 2724, "loss": 0.4296, "learning_rate": 5e-06, "epoch": 1.3318657127132636, "percentage": 44.42, "elapsed_time": "2:52:06", "remaining_time": "3:35:20"}
{"current_steps": 1220, "total_steps": 2724, "loss": 0.4399, "learning_rate": 5e-06, "epoch": 1.3428728673637864, "percentage": 44.79, "elapsed_time": "2:53:29", "remaining_time": "3:33:53"}
{"current_steps": 1230, "total_steps": 2724, "loss": 0.4364, "learning_rate": 5e-06, "epoch": 1.3538800220143092, "percentage": 45.15, "elapsed_time": "2:54:53", "remaining_time": "3:32:25"}
{"current_steps": 1240, "total_steps": 2724, "loss": 0.4379, "learning_rate": 5e-06, "epoch": 1.364887176664832, "percentage": 45.52, "elapsed_time": "2:56:16", "remaining_time": "3:30:57"}
{"current_steps": 1250, "total_steps": 2724, "loss": 0.4417, "learning_rate": 5e-06, "epoch": 1.3758943313153549, "percentage": 45.89, "elapsed_time": "2:57:39", "remaining_time": "3:29:29"}
{"current_steps": 1260, "total_steps": 2724, "loss": 0.44, "learning_rate": 5e-06, "epoch": 1.3869014859658777, "percentage": 46.26, "elapsed_time": "2:59:03", "remaining_time": "3:28:02"}
{"current_steps": 1270, "total_steps": 2724, "loss": 0.438, "learning_rate": 5e-06, "epoch": 1.3979086406164005, "percentage": 46.62, "elapsed_time": "3:00:26", "remaining_time": "3:26:34"}
{"current_steps": 1280, "total_steps": 2724, "loss": 0.4354, "learning_rate": 5e-06, "epoch": 1.4089157952669236, "percentage": 46.99, "elapsed_time": "3:01:49", "remaining_time": "3:25:07"}
{"current_steps": 1290, "total_steps": 2724, "loss": 0.4364, "learning_rate": 5e-06, "epoch": 1.4199229499174464, "percentage": 47.36, "elapsed_time": "3:03:13", "remaining_time": "3:23:40"}
{"current_steps": 1300, "total_steps": 2724, "loss": 0.433, "learning_rate": 5e-06, "epoch": 1.4309301045679692, "percentage": 47.72, "elapsed_time": "3:04:36", "remaining_time": "3:22:12"}
{"current_steps": 1310, "total_steps": 2724, "loss": 0.4305, "learning_rate": 5e-06, "epoch": 1.441937259218492, "percentage": 48.09, "elapsed_time": "3:05:59", "remaining_time": "3:20:45"}
{"current_steps": 1320, "total_steps": 2724, "loss": 0.4372, "learning_rate": 5e-06, "epoch": 1.4529444138690149, "percentage": 48.46, "elapsed_time": "3:07:23", "remaining_time": "3:19:18"}
{"current_steps": 1330, "total_steps": 2724, "loss": 0.4317, "learning_rate": 5e-06, "epoch": 1.4639515685195377, "percentage": 48.83, "elapsed_time": "3:08:46", "remaining_time": "3:17:51"}
{"current_steps": 1340, "total_steps": 2724, "loss": 0.4393, "learning_rate": 5e-06, "epoch": 1.4749587231700605, "percentage": 49.19, "elapsed_time": "3:10:09", "remaining_time": "3:16:24"}
{"current_steps": 1350, "total_steps": 2724, "loss": 0.4341, "learning_rate": 5e-06, "epoch": 1.4859658778205833, "percentage": 49.56, "elapsed_time": "3:11:32", "remaining_time": "3:14:57"}
{"current_steps": 1360, "total_steps": 2724, "loss": 0.4356, "learning_rate": 5e-06, "epoch": 1.4969730324711064, "percentage": 49.93, "elapsed_time": "3:12:55", "remaining_time": "3:13:29"}
{"current_steps": 1370, "total_steps": 2724, "loss": 0.4362, "learning_rate": 5e-06, "epoch": 1.5079801871216292, "percentage": 50.29, "elapsed_time": "3:14:19", "remaining_time": "3:12:02"}
{"current_steps": 1380, "total_steps": 2724, "loss": 0.4382, "learning_rate": 5e-06, "epoch": 1.518987341772152, "percentage": 50.66, "elapsed_time": "3:15:43", "remaining_time": "3:10:36"}
{"current_steps": 1390, "total_steps": 2724, "loss": 0.4273, "learning_rate": 5e-06, "epoch": 1.5299944964226748, "percentage": 51.03, "elapsed_time": "3:17:07", "remaining_time": "3:09:10"}
{"current_steps": 1400, "total_steps": 2724, "loss": 0.4299, "learning_rate": 5e-06, "epoch": 1.5410016510731976, "percentage": 51.4, "elapsed_time": "3:18:31", "remaining_time": "3:07:44"}
{"current_steps": 1410, "total_steps": 2724, "loss": 0.4341, "learning_rate": 5e-06, "epoch": 1.5520088057237205, "percentage": 51.76, "elapsed_time": "3:19:55", "remaining_time": "3:06:18"}
{"current_steps": 1420, "total_steps": 2724, "loss": 0.4365, "learning_rate": 5e-06, "epoch": 1.5630159603742433, "percentage": 52.13, "elapsed_time": "3:21:19", "remaining_time": "3:04:52"}
{"current_steps": 1430, "total_steps": 2724, "loss": 0.4351, "learning_rate": 5e-06, "epoch": 1.574023115024766, "percentage": 52.5, "elapsed_time": "3:22:42", "remaining_time": "3:03:26"}
{"current_steps": 1440, "total_steps": 2724, "loss": 0.4331, "learning_rate": 5e-06, "epoch": 1.585030269675289, "percentage": 52.86, "elapsed_time": "3:24:06", "remaining_time": "3:01:59"}
{"current_steps": 1450, "total_steps": 2724, "loss": 0.4292, "learning_rate": 5e-06, "epoch": 1.5960374243258117, "percentage": 53.23, "elapsed_time": "3:25:29", "remaining_time": "3:00:33"}
{"current_steps": 1460, "total_steps": 2724, "loss": 0.4366, "learning_rate": 5e-06, "epoch": 1.6070445789763346, "percentage": 53.6, "elapsed_time": "3:26:53", "remaining_time": "2:59:07"}
{"current_steps": 1470, "total_steps": 2724, "loss": 0.4361, "learning_rate": 5e-06, "epoch": 1.6180517336268574, "percentage": 53.96, "elapsed_time": "3:28:17", "remaining_time": "2:57:40"}
{"current_steps": 1480, "total_steps": 2724, "loss": 0.4308, "learning_rate": 5e-06, "epoch": 1.6290588882773802, "percentage": 54.33, "elapsed_time": "3:29:40", "remaining_time": "2:56:14"}
{"current_steps": 1490, "total_steps": 2724, "loss": 0.4312, "learning_rate": 5e-06, "epoch": 1.640066042927903, "percentage": 54.7, "elapsed_time": "3:31:03", "remaining_time": "2:54:48"}
{"current_steps": 1500, "total_steps": 2724, "loss": 0.4332, "learning_rate": 5e-06, "epoch": 1.6510731975784259, "percentage": 55.07, "elapsed_time": "3:32:27", "remaining_time": "2:53:21"}
{"current_steps": 1510, "total_steps": 2724, "loss": 0.4329, "learning_rate": 5e-06, "epoch": 1.6620803522289487, "percentage": 55.43, "elapsed_time": "3:33:50", "remaining_time": "2:51:55"}
{"current_steps": 1520, "total_steps": 2724, "loss": 0.4323, "learning_rate": 5e-06, "epoch": 1.6730875068794715, "percentage": 55.8, "elapsed_time": "3:35:13", "remaining_time": "2:50:29"}
{"current_steps": 1530, "total_steps": 2724, "loss": 0.4364, "learning_rate": 5e-06, "epoch": 1.6840946615299945, "percentage": 56.17, "elapsed_time": "3:36:37", "remaining_time": "2:49:03"}
{"current_steps": 1540, "total_steps": 2724, "loss": 0.4313, "learning_rate": 5e-06, "epoch": 1.6951018161805174, "percentage": 56.53, "elapsed_time": "3:38:01", "remaining_time": "2:47:37"}
{"current_steps": 1550, "total_steps": 2724, "loss": 0.4307, "learning_rate": 5e-06, "epoch": 1.7061089708310402, "percentage": 56.9, "elapsed_time": "3:39:25", "remaining_time": "2:46:12"}
{"current_steps": 1560, "total_steps": 2724, "loss": 0.4353, "learning_rate": 5e-06, "epoch": 1.717116125481563, "percentage": 57.27, "elapsed_time": "3:40:50", "remaining_time": "2:44:46"}
{"current_steps": 1570, "total_steps": 2724, "loss": 0.4328, "learning_rate": 5e-06, "epoch": 1.7281232801320858, "percentage": 57.64, "elapsed_time": "3:42:14", "remaining_time": "2:43:21"}
{"current_steps": 1580, "total_steps": 2724, "loss": 0.4287, "learning_rate": 5e-06, "epoch": 1.7391304347826086, "percentage": 58.0, "elapsed_time": "3:43:38", "remaining_time": "2:41:55"}
{"current_steps": 1590, "total_steps": 2724, "loss": 0.4362, "learning_rate": 5e-06, "epoch": 1.7501375894331317, "percentage": 58.37, "elapsed_time": "3:45:02", "remaining_time": "2:40:30"}
{"current_steps": 1600, "total_steps": 2724, "loss": 0.4295, "learning_rate": 5e-06, "epoch": 1.7611447440836545, "percentage": 58.74, "elapsed_time": "3:46:26", "remaining_time": "2:39:04"}
{"current_steps": 1610, "total_steps": 2724, "loss": 0.4298, "learning_rate": 5e-06, "epoch": 1.7721518987341773, "percentage": 59.1, "elapsed_time": "3:47:49", "remaining_time": "2:37:38"}
{"current_steps": 1620, "total_steps": 2724, "loss": 0.4298, "learning_rate": 5e-06, "epoch": 1.7831590533847002, "percentage": 59.47, "elapsed_time": "3:49:13", "remaining_time": "2:36:12"}
{"current_steps": 1630, "total_steps": 2724, "loss": 0.4317, "learning_rate": 5e-06, "epoch": 1.794166208035223, "percentage": 59.84, "elapsed_time": "3:50:36", "remaining_time": "2:34:46"}
{"current_steps": 1640, "total_steps": 2724, "loss": 0.4335, "learning_rate": 5e-06, "epoch": 1.8051733626857458, "percentage": 60.21, "elapsed_time": "3:51:59", "remaining_time": "2:33:20"}
{"current_steps": 1650, "total_steps": 2724, "loss": 0.4369, "learning_rate": 5e-06, "epoch": 1.8161805173362686, "percentage": 60.57, "elapsed_time": "3:53:23", "remaining_time": "2:31:54"}
{"current_steps": 1660, "total_steps": 2724, "loss": 0.4372, "learning_rate": 5e-06, "epoch": 1.8271876719867914, "percentage": 60.94, "elapsed_time": "3:54:46", "remaining_time": "2:30:28"}
{"current_steps": 1670, "total_steps": 2724, "loss": 0.4268, "learning_rate": 5e-06, "epoch": 1.8381948266373143, "percentage": 61.31, "elapsed_time": "3:56:09", "remaining_time": "2:29:02"}
{"current_steps": 1680, "total_steps": 2724, "loss": 0.4296, "learning_rate": 5e-06, "epoch": 1.849201981287837, "percentage": 61.67, "elapsed_time": "3:57:32", "remaining_time": "2:27:36"}
{"current_steps": 1690, "total_steps": 2724, "loss": 0.4359, "learning_rate": 5e-06, "epoch": 1.86020913593836, "percentage": 62.04, "elapsed_time": "3:58:55", "remaining_time": "2:26:11"}
{"current_steps": 1700, "total_steps": 2724, "loss": 0.438, "learning_rate": 5e-06, "epoch": 1.8712162905888827, "percentage": 62.41, "elapsed_time": "4:00:19", "remaining_time": "2:24:45"}
{"current_steps": 1710, "total_steps": 2724, "loss": 0.4312, "learning_rate": 5e-06, "epoch": 1.8822234452394055, "percentage": 62.78, "elapsed_time": "4:01:42", "remaining_time": "2:23:19"}
{"current_steps": 1720, "total_steps": 2724, "loss": 0.4336, "learning_rate": 5e-06, "epoch": 1.8932305998899284, "percentage": 63.14, "elapsed_time": "4:03:05", "remaining_time": "2:21:53"}
{"current_steps": 1730, "total_steps": 2724, "loss": 0.4296, "learning_rate": 5e-06, "epoch": 1.9042377545404512, "percentage": 63.51, "elapsed_time": "4:04:28", "remaining_time": "2:20:28"}
{"current_steps": 1740, "total_steps": 2724, "loss": 0.4305, "learning_rate": 5e-06, "epoch": 1.915244909190974, "percentage": 63.88, "elapsed_time": "4:05:52", "remaining_time": "2:19:02"}
{"current_steps": 1750, "total_steps": 2724, "loss": 0.4293, "learning_rate": 5e-06, "epoch": 1.9262520638414968, "percentage": 64.24, "elapsed_time": "4:07:15", "remaining_time": "2:17:37"}
{"current_steps": 1760, "total_steps": 2724, "loss": 0.4273, "learning_rate": 5e-06, "epoch": 1.9372592184920197, "percentage": 64.61, "elapsed_time": "4:08:38", "remaining_time": "2:16:11"}
{"current_steps": 1770, "total_steps": 2724, "loss": 0.4303, "learning_rate": 5e-06, "epoch": 1.9482663731425427, "percentage": 64.98, "elapsed_time": "4:10:00", "remaining_time": "2:14:45"}
{"current_steps": 1780, "total_steps": 2724, "loss": 0.4276, "learning_rate": 5e-06, "epoch": 1.9592735277930655, "percentage": 65.35, "elapsed_time": "4:11:23", "remaining_time": "2:13:19"}
{"current_steps": 1790, "total_steps": 2724, "loss": 0.43, "learning_rate": 5e-06, "epoch": 1.9702806824435883, "percentage": 65.71, "elapsed_time": "4:12:46", "remaining_time": "2:11:53"}
{"current_steps": 1800, "total_steps": 2724, "loss": 0.4291, "learning_rate": 5e-06, "epoch": 1.9812878370941112, "percentage": 66.08, "elapsed_time": "4:14:09", "remaining_time": "2:10:27"}
{"current_steps": 1810, "total_steps": 2724, "loss": 0.4296, "learning_rate": 5e-06, "epoch": 1.992294991744634, "percentage": 66.45, "elapsed_time": "4:15:32", "remaining_time": "2:09:02"}
{"current_steps": 1817, "total_steps": 2724, "eval_loss": 0.4724336564540863, "epoch": 2.0, "percentage": 66.7, "elapsed_time": "4:19:10", "remaining_time": "2:09:22"}
{"current_steps": 1820, "total_steps": 2724, "loss": 0.4165, "learning_rate": 5e-06, "epoch": 2.003302146395157, "percentage": 66.81, "elapsed_time": "4:20:34", "remaining_time": "2:09:25"}
{"current_steps": 1830, "total_steps": 2724, "loss": 0.379, "learning_rate": 5e-06, "epoch": 2.01430930104568, "percentage": 67.18, "elapsed_time": "4:21:57", "remaining_time": "2:07:58"}
{"current_steps": 1840, "total_steps": 2724, "loss": 0.3769, "learning_rate": 5e-06, "epoch": 2.0253164556962027, "percentage": 67.55, "elapsed_time": "4:23:20", "remaining_time": "2:06:31"}
{"current_steps": 1850, "total_steps": 2724, "loss": 0.3732, "learning_rate": 5e-06, "epoch": 2.0363236103467255, "percentage": 67.91, "elapsed_time": "4:24:43", "remaining_time": "2:05:03"}
{"current_steps": 1860, "total_steps": 2724, "loss": 0.379, "learning_rate": 5e-06, "epoch": 2.0473307649972483, "percentage": 68.28, "elapsed_time": "4:26:06", "remaining_time": "2:03:36"}
{"current_steps": 1870, "total_steps": 2724, "loss": 0.3792, "learning_rate": 5e-06, "epoch": 2.058337919647771, "percentage": 68.65, "elapsed_time": "4:27:29", "remaining_time": "2:02:09"}
{"current_steps": 1880, "total_steps": 2724, "loss": 0.379, "learning_rate": 5e-06, "epoch": 2.069345074298294, "percentage": 69.02, "elapsed_time": "4:28:53", "remaining_time": "2:00:42"}
{"current_steps": 1890, "total_steps": 2724, "loss": 0.378, "learning_rate": 5e-06, "epoch": 2.0803522289488168, "percentage": 69.38, "elapsed_time": "4:30:16", "remaining_time": "1:59:15"}
{"current_steps": 1900, "total_steps": 2724, "loss": 0.3776, "learning_rate": 5e-06, "epoch": 2.0913593835993396, "percentage": 69.75, "elapsed_time": "4:31:39", "remaining_time": "1:57:48"}
{"current_steps": 1910, "total_steps": 2724, "loss": 0.3737, "learning_rate": 5e-06, "epoch": 2.1023665382498624, "percentage": 70.12, "elapsed_time": "4:33:03", "remaining_time": "1:56:22"}
{"current_steps": 1920, "total_steps": 2724, "loss": 0.3772, "learning_rate": 5e-06, "epoch": 2.1133736929003852, "percentage": 70.48, "elapsed_time": "4:34:26", "remaining_time": "1:54:55"}
{"current_steps": 1930, "total_steps": 2724, "loss": 0.3701, "learning_rate": 5e-06, "epoch": 2.124380847550908, "percentage": 70.85, "elapsed_time": "4:35:49", "remaining_time": "1:53:28"}
{"current_steps": 1940, "total_steps": 2724, "loss": 0.3757, "learning_rate": 5e-06, "epoch": 2.135388002201431, "percentage": 71.22, "elapsed_time": "4:37:13", "remaining_time": "1:52:01"}
{"current_steps": 1950, "total_steps": 2724, "loss": 0.375, "learning_rate": 5e-06, "epoch": 2.1463951568519537, "percentage": 71.59, "elapsed_time": "4:38:36", "remaining_time": "1:50:34"}
{"current_steps": 1960, "total_steps": 2724, "loss": 0.3814, "learning_rate": 5e-06, "epoch": 2.1574023115024765, "percentage": 71.95, "elapsed_time": "4:39:58", "remaining_time": "1:49:08"}
{"current_steps": 1970, "total_steps": 2724, "loss": 0.3744, "learning_rate": 5e-06, "epoch": 2.1684094661529993, "percentage": 72.32, "elapsed_time": "4:41:21", "remaining_time": "1:47:41"}
{"current_steps": 1980, "total_steps": 2724, "loss": 0.3741, "learning_rate": 5e-06, "epoch": 2.179416620803522, "percentage": 72.69, "elapsed_time": "4:42:44", "remaining_time": "1:46:14"}
{"current_steps": 1990, "total_steps": 2724, "loss": 0.378, "learning_rate": 5e-06, "epoch": 2.190423775454045, "percentage": 73.05, "elapsed_time": "4:44:07", "remaining_time": "1:44:47"}
{"current_steps": 2000, "total_steps": 2724, "loss": 0.3769, "learning_rate": 5e-06, "epoch": 2.201430930104568, "percentage": 73.42, "elapsed_time": "4:45:30", "remaining_time": "1:43:21"}
{"current_steps": 2010, "total_steps": 2724, "loss": 0.3775, "learning_rate": 5e-06, "epoch": 2.2124380847550906, "percentage": 73.79, "elapsed_time": "4:46:53", "remaining_time": "1:41:54"}
{"current_steps": 2020, "total_steps": 2724, "loss": 0.3809, "learning_rate": 5e-06, "epoch": 2.2234452394056134, "percentage": 74.16, "elapsed_time": "4:48:16", "remaining_time": "1:40:28"}
{"current_steps": 2030, "total_steps": 2724, "loss": 0.3741, "learning_rate": 5e-06, "epoch": 2.2344523940561363, "percentage": 74.52, "elapsed_time": "4:49:39", "remaining_time": "1:39:01"}
{"current_steps": 2040, "total_steps": 2724, "loss": 0.3811, "learning_rate": 5e-06, "epoch": 2.2454595487066595, "percentage": 74.89, "elapsed_time": "4:51:02", "remaining_time": "1:37:34"}
{"current_steps": 2050, "total_steps": 2724, "loss": 0.3759, "learning_rate": 5e-06, "epoch": 2.2564667033571824, "percentage": 75.26, "elapsed_time": "4:52:25", "remaining_time": "1:36:08"}
{"current_steps": 2060, "total_steps": 2724, "loss": 0.3777, "learning_rate": 5e-06, "epoch": 2.267473858007705, "percentage": 75.62, "elapsed_time": "4:53:48", "remaining_time": "1:34:42"}
{"current_steps": 2070, "total_steps": 2724, "loss": 0.3809, "learning_rate": 5e-06, "epoch": 2.278481012658228, "percentage": 75.99, "elapsed_time": "4:55:12", "remaining_time": "1:33:15"}
{"current_steps": 2080, "total_steps": 2724, "loss": 0.3748, "learning_rate": 5e-06, "epoch": 2.289488167308751, "percentage": 76.36, "elapsed_time": "4:56:35", "remaining_time": "1:31:49"}
{"current_steps": 2090, "total_steps": 2724, "loss": 0.3774, "learning_rate": 5e-06, "epoch": 2.3004953219592736, "percentage": 76.73, "elapsed_time": "4:57:58", "remaining_time": "1:30:23"}
{"current_steps": 2100, "total_steps": 2724, "loss": 0.3802, "learning_rate": 5e-06, "epoch": 2.3115024766097965, "percentage": 77.09, "elapsed_time": "4:59:21", "remaining_time": "1:28:57"}
{"current_steps": 2110, "total_steps": 2724, "loss": 0.3835, "learning_rate": 5e-06, "epoch": 2.3225096312603193, "percentage": 77.46, "elapsed_time": "5:00:44", "remaining_time": "1:27:30"}
{"current_steps": 2120, "total_steps": 2724, "loss": 0.378, "learning_rate": 5e-06, "epoch": 2.333516785910842, "percentage": 77.83, "elapsed_time": "5:02:08", "remaining_time": "1:26:04"}
{"current_steps": 2130, "total_steps": 2724, "loss": 0.378, "learning_rate": 5e-06, "epoch": 2.344523940561365, "percentage": 78.19, "elapsed_time": "5:03:31", "remaining_time": "1:24:38"}
{"current_steps": 2140, "total_steps": 2724, "loss": 0.3854, "learning_rate": 5e-06, "epoch": 2.3555310952118877, "percentage": 78.56, "elapsed_time": "5:04:54", "remaining_time": "1:23:12"}
{"current_steps": 2150, "total_steps": 2724, "loss": 0.3818, "learning_rate": 5e-06, "epoch": 2.3665382498624106, "percentage": 78.93, "elapsed_time": "5:06:18", "remaining_time": "1:21:46"}
{"current_steps": 2160, "total_steps": 2724, "loss": 0.3818, "learning_rate": 5e-06, "epoch": 2.3775454045129334, "percentage": 79.3, "elapsed_time": "5:07:41", "remaining_time": "1:20:20"}
{"current_steps": 2170, "total_steps": 2724, "loss": 0.3772, "learning_rate": 5e-06, "epoch": 2.388552559163456, "percentage": 79.66, "elapsed_time": "5:09:04", "remaining_time": "1:18:54"}
{"current_steps": 2180, "total_steps": 2724, "loss": 0.3811, "learning_rate": 5e-06, "epoch": 2.399559713813979, "percentage": 80.03, "elapsed_time": "5:10:28", "remaining_time": "1:17:28"}
{"current_steps": 2190, "total_steps": 2724, "loss": 0.3783, "learning_rate": 5e-06, "epoch": 2.410566868464502, "percentage": 80.4, "elapsed_time": "5:11:51", "remaining_time": "1:16:02"}
{"current_steps": 2200, "total_steps": 2724, "loss": 0.3793, "learning_rate": 5e-06, "epoch": 2.4215740231150247, "percentage": 80.76, "elapsed_time": "5:13:14", "remaining_time": "1:14:36"}
{"current_steps": 2210, "total_steps": 2724, "loss": 0.3803, "learning_rate": 5e-06, "epoch": 2.4325811777655475, "percentage": 81.13, "elapsed_time": "5:14:37", "remaining_time": "1:13:10"}
{"current_steps": 2220, "total_steps": 2724, "loss": 0.3788, "learning_rate": 5e-06, "epoch": 2.4435883324160703, "percentage": 81.5, "elapsed_time": "5:16:01", "remaining_time": "1:11:44"}
{"current_steps": 2230, "total_steps": 2724, "loss": 0.3817, "learning_rate": 5e-06, "epoch": 2.454595487066593, "percentage": 81.86, "elapsed_time": "5:17:24", "remaining_time": "1:10:18"}
{"current_steps": 2240, "total_steps": 2724, "loss": 0.3778, "learning_rate": 5e-06, "epoch": 2.465602641717116, "percentage": 82.23, "elapsed_time": "5:18:47", "remaining_time": "1:08:52"}
{"current_steps": 2250, "total_steps": 2724, "loss": 0.3805, "learning_rate": 5e-06, "epoch": 2.476609796367639, "percentage": 82.6, "elapsed_time": "5:20:11", "remaining_time": "1:07:27"}
{"current_steps": 2260, "total_steps": 2724, "loss": 0.3805, "learning_rate": 5e-06, "epoch": 2.487616951018162, "percentage": 82.97, "elapsed_time": "5:21:34", "remaining_time": "1:06:01"}
{"current_steps": 2270, "total_steps": 2724, "loss": 0.3779, "learning_rate": 5e-06, "epoch": 2.498624105668685, "percentage": 83.33, "elapsed_time": "5:22:57", "remaining_time": "1:04:35"}
{"current_steps": 2280, "total_steps": 2724, "loss": 0.3818, "learning_rate": 5e-06, "epoch": 2.5096312603192077, "percentage": 83.7, "elapsed_time": "5:24:20", "remaining_time": "1:03:09"}
{"current_steps": 2290, "total_steps": 2724, "loss": 0.3774, "learning_rate": 5e-06, "epoch": 2.5206384149697305, "percentage": 84.07, "elapsed_time": "5:25:44", "remaining_time": "1:01:44"}
{"current_steps": 2300, "total_steps": 2724, "loss": 0.3787, "learning_rate": 5e-06, "epoch": 2.5316455696202533, "percentage": 84.43, "elapsed_time": "5:27:07", "remaining_time": "1:00:18"}
{"current_steps": 2310, "total_steps": 2724, "loss": 0.3826, "learning_rate": 5e-06, "epoch": 2.542652724270776, "percentage": 84.8, "elapsed_time": "5:28:30", "remaining_time": "0:58:52"}
{"current_steps": 2320, "total_steps": 2724, "loss": 0.3825, "learning_rate": 5e-06, "epoch": 2.553659878921299, "percentage": 85.17, "elapsed_time": "5:29:54", "remaining_time": "0:57:27"}
{"current_steps": 2330, "total_steps": 2724, "loss": 0.3794, "learning_rate": 5e-06, "epoch": 2.564667033571822, "percentage": 85.54, "elapsed_time": "5:31:18", "remaining_time": "0:56:01"}
{"current_steps": 2340, "total_steps": 2724, "loss": 0.38, "learning_rate": 5e-06, "epoch": 2.5756741882223446, "percentage": 85.9, "elapsed_time": "5:32:42", "remaining_time": "0:54:35"}
{"current_steps": 2350, "total_steps": 2724, "loss": 0.3782, "learning_rate": 5e-06, "epoch": 2.5866813428728674, "percentage": 86.27, "elapsed_time": "5:34:05", "remaining_time": "0:53:10"}
{"current_steps": 2360, "total_steps": 2724, "loss": 0.3839, "learning_rate": 5e-06, "epoch": 2.5976884975233903, "percentage": 86.64, "elapsed_time": "5:35:28", "remaining_time": "0:51:44"}
{"current_steps": 2370, "total_steps": 2724, "loss": 0.3834, "learning_rate": 5e-06, "epoch": 2.608695652173913, "percentage": 87.0, "elapsed_time": "5:36:51", "remaining_time": "0:50:18"}
{"current_steps": 2380, "total_steps": 2724, "loss": 0.3768, "learning_rate": 5e-06, "epoch": 2.619702806824436, "percentage": 87.37, "elapsed_time": "5:38:14", "remaining_time": "0:48:53"}
{"current_steps": 2390, "total_steps": 2724, "loss": 0.3809, "learning_rate": 5e-06, "epoch": 2.6307099614749587, "percentage": 87.74, "elapsed_time": "5:39:38", "remaining_time": "0:47:27"}
{"current_steps": 2400, "total_steps": 2724, "loss": 0.379, "learning_rate": 5e-06, "epoch": 2.6417171161254815, "percentage": 88.11, "elapsed_time": "5:41:01", "remaining_time": "0:46:02"}
{"current_steps": 2410, "total_steps": 2724, "loss": 0.3794, "learning_rate": 5e-06, "epoch": 2.6527242707760044, "percentage": 88.47, "elapsed_time": "5:42:24", "remaining_time": "0:44:36"}
{"current_steps": 2420, "total_steps": 2724, "loss": 0.3776, "learning_rate": 5e-06, "epoch": 2.663731425426527, "percentage": 88.84, "elapsed_time": "5:43:46", "remaining_time": "0:43:11"}
{"current_steps": 2430, "total_steps": 2724, "loss": 0.3809, "learning_rate": 5e-06, "epoch": 2.67473858007705, "percentage": 89.21, "elapsed_time": "5:45:10", "remaining_time": "0:41:45"}
{"current_steps": 2440, "total_steps": 2724, "loss": 0.379, "learning_rate": 5e-06, "epoch": 2.685745734727573, "percentage": 89.57, "elapsed_time": "5:46:33", "remaining_time": "0:40:20"}
{"current_steps": 2450, "total_steps": 2724, "loss": 0.3777, "learning_rate": 5e-06, "epoch": 2.6967528893780957, "percentage": 89.94, "elapsed_time": "5:47:56", "remaining_time": "0:38:54"}
{"current_steps": 2460, "total_steps": 2724, "loss": 0.381, "learning_rate": 5e-06, "epoch": 2.7077600440286185, "percentage": 90.31, "elapsed_time": "5:49:19", "remaining_time": "0:37:29"}
{"current_steps": 2470, "total_steps": 2724, "loss": 0.3829, "learning_rate": 5e-06, "epoch": 2.7187671986791413, "percentage": 90.68, "elapsed_time": "5:50:43", "remaining_time": "0:36:03"}
{"current_steps": 2480, "total_steps": 2724, "loss": 0.3798, "learning_rate": 5e-06, "epoch": 2.729774353329664, "percentage": 91.04, "elapsed_time": "5:52:06", "remaining_time": "0:34:38"}
{"current_steps": 2490, "total_steps": 2724, "loss": 0.3803, "learning_rate": 5e-06, "epoch": 2.740781507980187, "percentage": 91.41, "elapsed_time": "5:53:29", "remaining_time": "0:33:13"}
{"current_steps": 2500, "total_steps": 2724, "loss": 0.3836, "learning_rate": 5e-06, "epoch": 2.7517886626307098, "percentage": 91.78, "elapsed_time": "5:54:53", "remaining_time": "0:31:47"}
{"current_steps": 2510, "total_steps": 2724, "loss": 0.3771, "learning_rate": 5e-06, "epoch": 2.7627958172812326, "percentage": 92.14, "elapsed_time": "5:56:17", "remaining_time": "0:30:22"}
{"current_steps": 2520, "total_steps": 2724, "loss": 0.3832, "learning_rate": 5e-06, "epoch": 2.7738029719317554, "percentage": 92.51, "elapsed_time": "5:57:41", "remaining_time": "0:28:57"}
{"current_steps": 2530, "total_steps": 2724, "loss": 0.3758, "learning_rate": 5e-06, "epoch": 2.7848101265822782, "percentage": 92.88, "elapsed_time": "5:59:05", "remaining_time": "0:27:32"}
{"current_steps": 2540, "total_steps": 2724, "loss": 0.3846, "learning_rate": 5e-06, "epoch": 2.795817281232801, "percentage": 93.25, "elapsed_time": "6:00:28", "remaining_time": "0:26:06"}
{"current_steps": 2550, "total_steps": 2724, "loss": 0.3805, "learning_rate": 5e-06, "epoch": 2.8068244358833243, "percentage": 93.61, "elapsed_time": "6:01:51", "remaining_time": "0:24:41"}
{"current_steps": 2560, "total_steps": 2724, "loss": 0.3814, "learning_rate": 5e-06, "epoch": 2.817831590533847, "percentage": 93.98, "elapsed_time": "6:03:15", "remaining_time": "0:23:16"}
{"current_steps": 2570, "total_steps": 2724, "loss": 0.3833, "learning_rate": 5e-06, "epoch": 2.82883874518437, "percentage": 94.35, "elapsed_time": "6:04:39", "remaining_time": "0:21:51"}
{"current_steps": 2580, "total_steps": 2724, "loss": 0.3785, "learning_rate": 5e-06, "epoch": 2.8398458998348928, "percentage": 94.71, "elapsed_time": "6:06:02", "remaining_time": "0:20:25"}
{"current_steps": 2590, "total_steps": 2724, "loss": 0.3791, "learning_rate": 5e-06, "epoch": 2.8508530544854156, "percentage": 95.08, "elapsed_time": "6:07:26", "remaining_time": "0:19:00"}
{"current_steps": 2600, "total_steps": 2724, "loss": 0.3771, "learning_rate": 5e-06, "epoch": 2.8618602091359384, "percentage": 95.45, "elapsed_time": "6:08:49", "remaining_time": "0:17:35"}
{"current_steps": 2610, "total_steps": 2724, "loss": 0.3814, "learning_rate": 5e-06, "epoch": 2.8728673637864612, "percentage": 95.81, "elapsed_time": "6:10:13", "remaining_time": "0:16:10"}
{"current_steps": 2620, "total_steps": 2724, "loss": 0.3879, "learning_rate": 5e-06, "epoch": 2.883874518436984, "percentage": 96.18, "elapsed_time": "6:11:36", "remaining_time": "0:14:45"}
{"current_steps": 2630, "total_steps": 2724, "loss": 0.3756, "learning_rate": 5e-06, "epoch": 2.894881673087507, "percentage": 96.55, "elapsed_time": "6:13:00", "remaining_time": "0:13:19"}
{"current_steps": 2640, "total_steps": 2724, "loss": 0.3791, "learning_rate": 5e-06, "epoch": 2.9058888277380297, "percentage": 96.92, "elapsed_time": "6:14:23", "remaining_time": "0:11:54"}
{"current_steps": 2650, "total_steps": 2724, "loss": 0.383, "learning_rate": 5e-06, "epoch": 2.9168959823885525, "percentage": 97.28, "elapsed_time": "6:15:46", "remaining_time": "0:10:29"}
{"current_steps": 2660, "total_steps": 2724, "loss": 0.3838, "learning_rate": 5e-06, "epoch": 2.9279031370390753, "percentage": 97.65, "elapsed_time": "6:17:10", "remaining_time": "0:09:04"}
{"current_steps": 2670, "total_steps": 2724, "loss": 0.3805, "learning_rate": 5e-06, "epoch": 2.938910291689598, "percentage": 98.02, "elapsed_time": "6:18:33", "remaining_time": "0:07:39"}
{"current_steps": 2680, "total_steps": 2724, "loss": 0.379, "learning_rate": 5e-06, "epoch": 2.949917446340121, "percentage": 98.38, "elapsed_time": "6:19:56", "remaining_time": "0:06:14"}
{"current_steps": 2690, "total_steps": 2724, "loss": 0.3779, "learning_rate": 5e-06, "epoch": 2.960924600990644, "percentage": 98.75, "elapsed_time": "6:21:19", "remaining_time": "0:04:49"}
{"current_steps": 2700, "total_steps": 2724, "loss": 0.3791, "learning_rate": 5e-06, "epoch": 2.9719317556411666, "percentage": 99.12, "elapsed_time": "6:22:43", "remaining_time": "0:03:24"}
{"current_steps": 2710, "total_steps": 2724, "loss": 0.377, "learning_rate": 5e-06, "epoch": 2.9829389102916894, "percentage": 99.49, "elapsed_time": "6:24:06", "remaining_time": "0:01:59"}
{"current_steps": 2720, "total_steps": 2724, "loss": 0.3803, "learning_rate": 5e-06, "epoch": 2.9939460649422127, "percentage": 99.85, "elapsed_time": "6:25:30", "remaining_time": "0:00:34"}
|