{"current_steps": 10, "total_steps": 12855, "loss": 0.9946, "accuracy": 0.6000000238418579, "learning_rate": 4.9999925343886e-05, "epoch": 0.0007779074290159471, "percentage": 0.08, "elapsed_time": "0:00:11", "remaining_time": "4:10:13", "throughput": 1051.3, "total_tokens": 12288} {"current_steps": 20, "total_steps": 12855, "loss": 1.2427, "accuracy": 0.699999988079071, "learning_rate": 4.999970137598988e-05, "epoch": 0.0015558148580318942, "percentage": 0.16, "elapsed_time": "0:00:20", "remaining_time": "3:37:55", "throughput": 1282.36, "total_tokens": 26128} {"current_steps": 30, "total_steps": 12855, "loss": 1.2893, "accuracy": 0.5, "learning_rate": 4.999932809764929e-05, "epoch": 0.002333722287047841, "percentage": 0.23, "elapsed_time": "0:00:29", "remaining_time": "3:33:19", "throughput": 1385.67, "total_tokens": 41488} {"current_steps": 40, "total_steps": 12855, "loss": 1.2549, "accuracy": 0.20000000298023224, "learning_rate": 4.999880551109363e-05, "epoch": 0.0031116297160637884, "percentage": 0.31, "elapsed_time": "0:00:37", "remaining_time": "3:22:34", "throughput": 1414.48, "total_tokens": 53664} {"current_steps": 50, "total_steps": 12855, "loss": 0.7365, "accuracy": 1.0, "learning_rate": 4.999813361944403e-05, "epoch": 0.0038895371450797353, "percentage": 0.39, "elapsed_time": "0:00:45", "remaining_time": "3:12:46", "throughput": 1388.05, "total_tokens": 62688} {"current_steps": 60, "total_steps": 12855, "loss": 0.8873, "accuracy": 0.5, "learning_rate": 4.9997312426713375e-05, "epoch": 0.004667444574095682, "percentage": 0.47, "elapsed_time": "0:00:53", "remaining_time": "3:11:31", "throughput": 1414.54, "total_tokens": 76224} {"current_steps": 70, "total_steps": 12855, "loss": 1.1815, "accuracy": 0.699999988079071, "learning_rate": 4.9996341937806215e-05, "epoch": 0.0054453520031116295, "percentage": 0.54, "elapsed_time": "0:01:01", "remaining_time": "3:05:53", "throughput": 1401.75, "total_tokens": 85600} {"current_steps": 80, "total_steps": 12855, "loss": 1.3283, "accuracy": 0.6000000238418579, "learning_rate": 4.999522215851879e-05, "epoch": 0.006223259432127577, "percentage": 0.62, "elapsed_time": "0:01:09", "remaining_time": "3:05:34", "throughput": 1419.0, "total_tokens": 98944} {"current_steps": 90, "total_steps": 12855, "loss": 0.9855, "accuracy": 0.5, "learning_rate": 4.999395309553898e-05, "epoch": 0.007001166861143524, "percentage": 0.7, "elapsed_time": "0:01:18", "remaining_time": "3:04:31", "throughput": 1435.19, "total_tokens": 112032} {"current_steps": 100, "total_steps": 12855, "loss": 0.8797, "accuracy": 0.699999988079071, "learning_rate": 4.999253475644623e-05, "epoch": 0.007779074290159471, "percentage": 0.78, "elapsed_time": "0:01:25", "remaining_time": "3:02:13", "throughput": 1439.83, "total_tokens": 123424} {"current_steps": 110, "total_steps": 12855, "loss": 1.2075, "accuracy": 0.4000000059604645, "learning_rate": 4.999096714971156e-05, "epoch": 0.008556981719175419, "percentage": 0.86, "elapsed_time": "0:01:34", "remaining_time": "3:02:48", "throughput": 1461.94, "total_tokens": 138400} {"current_steps": 120, "total_steps": 12855, "loss": 0.8176, "accuracy": 0.699999988079071, "learning_rate": 4.99892502846975e-05, "epoch": 0.009334889148191364, "percentage": 0.93, "elapsed_time": "0:01:44", "remaining_time": "3:04:06", "throughput": 1473.29, "total_tokens": 153360} {"current_steps": 130, "total_steps": 12855, "loss": 1.0001, "accuracy": 0.6000000238418579, "learning_rate": 4.9987384171657994e-05, "epoch": 0.010112796577207312, "percentage": 1.01, "elapsed_time": "0:01:51", "remaining_time": "3:02:37", "throughput": 1474.67, "total_tokens": 165072} {"current_steps": 140, "total_steps": 12855, "loss": 0.8903, "accuracy": 0.8999999761581421, "learning_rate": 4.9985368821738385e-05, "epoch": 0.010890704006223259, "percentage": 1.09, "elapsed_time": "0:01:59", "remaining_time": "3:01:10", "throughput": 1468.96, "total_tokens": 175824} {"current_steps": 150, "total_steps": 12855, "loss": 0.9588, "accuracy": 0.699999988079071, "learning_rate": 4.998320424697532e-05, "epoch": 0.011668611435239206, "percentage": 1.17, "elapsed_time": "0:02:06", "remaining_time": "2:59:13", "throughput": 1467.53, "total_tokens": 186320} {"current_steps": 160, "total_steps": 12855, "loss": 0.9697, "accuracy": 0.6000000238418579, "learning_rate": 4.998089046029671e-05, "epoch": 0.012446518864255154, "percentage": 1.24, "elapsed_time": "0:02:16", "remaining_time": "3:01:02", "throughput": 1483.26, "total_tokens": 203072} {"current_steps": 170, "total_steps": 12855, "loss": 0.9788, "accuracy": 0.699999988079071, "learning_rate": 4.9978427475521616e-05, "epoch": 0.013224426293271101, "percentage": 1.32, "elapsed_time": "0:02:24", "remaining_time": "2:59:31", "throughput": 1484.83, "total_tokens": 214336} {"current_steps": 180, "total_steps": 12855, "loss": 0.8951, "accuracy": 0.6000000238418579, "learning_rate": 4.9975815307360194e-05, "epoch": 0.014002333722287048, "percentage": 1.4, "elapsed_time": "0:02:46", "remaining_time": "3:15:24", "throughput": 1395.54, "total_tokens": 232368} {"current_steps": 190, "total_steps": 12855, "loss": 0.9661, "accuracy": 0.800000011920929, "learning_rate": 4.997305397141357e-05, "epoch": 0.014780241151302996, "percentage": 1.48, "elapsed_time": "0:02:54", "remaining_time": "3:14:05", "throughput": 1390.69, "total_tokens": 242960} {"current_steps": 200, "total_steps": 12855, "loss": 0.9529, "accuracy": 0.6000000238418579, "learning_rate": 4.997014348417382e-05, "epoch": 0.015558148580318941, "percentage": 1.56, "elapsed_time": "0:03:04", "remaining_time": "3:14:34", "throughput": 1398.82, "total_tokens": 258080} {"current_steps": 210, "total_steps": 12855, "loss": 1.2197, "accuracy": 0.8999999761581421, "learning_rate": 4.9967083863023776e-05, "epoch": 0.01633605600933489, "percentage": 1.63, "elapsed_time": "0:03:14", "remaining_time": "3:14:43", "throughput": 1401.38, "total_tokens": 271920} {"current_steps": 220, "total_steps": 12855, "loss": 0.8338, "accuracy": 0.699999988079071, "learning_rate": 4.9963875126237016e-05, "epoch": 0.017113963438350838, "percentage": 1.71, "elapsed_time": "0:03:47", "remaining_time": "3:37:43", "throughput": 1259.87, "total_tokens": 286576} {"current_steps": 230, "total_steps": 12855, "loss": 1.2993, "accuracy": 0.6000000238418579, "learning_rate": 4.9960517292977655e-05, "epoch": 0.017891870867366783, "percentage": 1.79, "elapsed_time": "0:03:55", "remaining_time": "3:35:10", "throughput": 1262.32, "total_tokens": 296896} {"current_steps": 240, "total_steps": 12855, "loss": 1.0844, "accuracy": 0.4000000059604645, "learning_rate": 4.995701038330033e-05, "epoch": 0.01866977829638273, "percentage": 1.87, "elapsed_time": "0:04:04", "remaining_time": "3:34:23", "throughput": 1272.0, "total_tokens": 311296} {"current_steps": 250, "total_steps": 12855, "loss": 1.2243, "accuracy": 0.5, "learning_rate": 4.995335441815003e-05, "epoch": 0.019447685725398678, "percentage": 1.94, "elapsed_time": "0:04:12", "remaining_time": "3:31:51", "throughput": 1273.96, "total_tokens": 321184} {"current_steps": 260, "total_steps": 12855, "loss": 1.0084, "accuracy": 0.6000000238418579, "learning_rate": 4.9949549419361954e-05, "epoch": 0.020225593154414623, "percentage": 2.02, "elapsed_time": "0:04:20", "remaining_time": "3:30:13", "throughput": 1272.5, "total_tokens": 331328} {"current_steps": 270, "total_steps": 12855, "loss": 1.0466, "accuracy": 0.6000000238418579, "learning_rate": 4.994559540966142e-05, "epoch": 0.021003500583430573, "percentage": 2.1, "elapsed_time": "0:04:35", "remaining_time": "3:33:47", "throughput": 1255.32, "total_tokens": 345456} {"current_steps": 280, "total_steps": 12855, "loss": 1.0896, "accuracy": 0.4000000059604645, "learning_rate": 4.994149241266371e-05, "epoch": 0.021781408012446518, "percentage": 2.18, "elapsed_time": "0:04:43", "remaining_time": "3:32:23", "throughput": 1260.13, "total_tokens": 357568} {"current_steps": 290, "total_steps": 12855, "loss": 0.9888, "accuracy": 0.699999988079071, "learning_rate": 4.993724045287392e-05, "epoch": 0.022559315441462467, "percentage": 2.26, "elapsed_time": "0:04:53", "remaining_time": "3:31:45", "throughput": 1273.63, "total_tokens": 373472} {"current_steps": 300, "total_steps": 12855, "loss": 0.9519, "accuracy": 0.6000000238418579, "learning_rate": 4.993283955568685e-05, "epoch": 0.023337222870478413, "percentage": 2.33, "elapsed_time": "0:05:01", "remaining_time": "3:30:16", "throughput": 1280.63, "total_tokens": 386080} {"current_steps": 310, "total_steps": 12855, "loss": 0.961, "accuracy": 0.699999988079071, "learning_rate": 4.99282897473868e-05, "epoch": 0.024115130299494362, "percentage": 2.41, "elapsed_time": "0:05:09", "remaining_time": "3:28:38", "throughput": 1281.34, "total_tokens": 396368} {"current_steps": 320, "total_steps": 12855, "loss": 1.1594, "accuracy": 0.6000000238418579, "learning_rate": 4.9923591055147455e-05, "epoch": 0.024893037728510307, "percentage": 2.49, "elapsed_time": "0:05:21", "remaining_time": "3:29:39", "throughput": 1290.37, "total_tokens": 414368} {"current_steps": 330, "total_steps": 12855, "loss": 0.9619, "accuracy": 0.6000000238418579, "learning_rate": 4.99187435070317e-05, "epoch": 0.025670945157526253, "percentage": 2.57, "elapsed_time": "0:05:29", "remaining_time": "3:28:19", "throughput": 1289.87, "total_tokens": 424800} {"current_steps": 340, "total_steps": 12855, "loss": 1.1314, "accuracy": 0.699999988079071, "learning_rate": 4.991374713199145e-05, "epoch": 0.026448852586542202, "percentage": 2.64, "elapsed_time": "0:05:37", "remaining_time": "3:26:56", "throughput": 1292.5, "total_tokens": 435984} {"current_steps": 350, "total_steps": 12855, "loss": 1.2046, "accuracy": 0.6000000238418579, "learning_rate": 4.990860195986753e-05, "epoch": 0.027226760015558148, "percentage": 2.72, "elapsed_time": "0:05:46", "remaining_time": "3:26:05", "throughput": 1297.69, "total_tokens": 449136} {"current_steps": 360, "total_steps": 12855, "loss": 0.8601, "accuracy": 0.6000000238418579, "learning_rate": 4.990330802138941e-05, "epoch": 0.028004667444574097, "percentage": 2.8, "elapsed_time": "0:05:54", "remaining_time": "3:25:08", "throughput": 1301.95, "total_tokens": 461712} {"current_steps": 370, "total_steps": 12855, "loss": 0.9149, "accuracy": 0.699999988079071, "learning_rate": 4.989786534817507e-05, "epoch": 0.028782574873590042, "percentage": 2.88, "elapsed_time": "0:06:01", "remaining_time": "3:23:30", "throughput": 1302.52, "total_tokens": 471328} {"current_steps": 380, "total_steps": 12855, "loss": 1.0315, "accuracy": 0.5, "learning_rate": 4.989227397273082e-05, "epoch": 0.02956048230260599, "percentage": 2.96, "elapsed_time": "0:06:09", "remaining_time": "3:22:09", "throughput": 1303.77, "total_tokens": 481728} {"current_steps": 390, "total_steps": 12855, "loss": 1.1379, "accuracy": 0.5, "learning_rate": 4.9886533928451104e-05, "epoch": 0.030338389731621937, "percentage": 3.03, "elapsed_time": "0:06:16", "remaining_time": "3:20:49", "throughput": 1304.7, "total_tokens": 491856} {"current_steps": 400, "total_steps": 12855, "loss": 0.9889, "accuracy": 0.800000011920929, "learning_rate": 4.9880645249618266e-05, "epoch": 0.031116297160637883, "percentage": 3.11, "elapsed_time": "0:06:25", "remaining_time": "3:19:57", "throughput": 1308.23, "total_tokens": 504080} {"current_steps": 410, "total_steps": 12855, "loss": 1.1025, "accuracy": 0.6000000238418579, "learning_rate": 4.9874607971402366e-05, "epoch": 0.03189420458965383, "percentage": 3.19, "elapsed_time": "0:06:34", "remaining_time": "3:19:38", "throughput": 1314.37, "total_tokens": 518688} {"current_steps": 420, "total_steps": 12855, "loss": 1.0915, "accuracy": 0.5, "learning_rate": 4.986842212986099e-05, "epoch": 0.03267211201866978, "percentage": 3.27, "elapsed_time": "0:06:43", "remaining_time": "3:19:13", "throughput": 1317.45, "total_tokens": 531904} {"current_steps": 430, "total_steps": 12855, "loss": 1.0653, "accuracy": 0.800000011920929, "learning_rate": 4.986208776193902e-05, "epoch": 0.033450019447685726, "percentage": 3.35, "elapsed_time": "0:06:52", "remaining_time": "3:18:28", "throughput": 1321.11, "total_tokens": 544448} {"current_steps": 440, "total_steps": 12855, "loss": 0.9403, "accuracy": 0.699999988079071, "learning_rate": 4.985560490546839e-05, "epoch": 0.034227926876701675, "percentage": 3.42, "elapsed_time": "0:07:27", "remaining_time": "3:30:16", "throughput": 1249.23, "total_tokens": 558576} {"current_steps": 450, "total_steps": 12855, "loss": 0.8978, "accuracy": 0.699999988079071, "learning_rate": 4.984897359916788e-05, "epoch": 0.03500583430571762, "percentage": 3.5, "elapsed_time": "0:07:34", "remaining_time": "3:28:46", "throughput": 1249.02, "total_tokens": 567568} {"current_steps": 460, "total_steps": 12855, "loss": 1.3919, "accuracy": 0.4000000059604645, "learning_rate": 4.9842193882642906e-05, "epoch": 0.035783741734733567, "percentage": 3.58, "elapsed_time": "0:07:43", "remaining_time": "3:27:57", "throughput": 1256.07, "total_tokens": 581632} {"current_steps": 470, "total_steps": 12855, "loss": 1.163, "accuracy": 0.5, "learning_rate": 4.9835265796385254e-05, "epoch": 0.036561649163749516, "percentage": 3.66, "elapsed_time": "0:07:50", "remaining_time": "3:26:47", "throughput": 1263.51, "total_tokens": 594912} {"current_steps": 480, "total_steps": 12855, "loss": 1.1806, "accuracy": 0.699999988079071, "learning_rate": 4.982818938177284e-05, "epoch": 0.03733955659276546, "percentage": 3.73, "elapsed_time": "0:07:58", "remaining_time": "3:25:31", "throughput": 1270.76, "total_tokens": 607808} {"current_steps": 490, "total_steps": 12855, "loss": 1.1041, "accuracy": 0.6000000238418579, "learning_rate": 4.982096468106947e-05, "epoch": 0.03811746402178141, "percentage": 3.81, "elapsed_time": "0:08:12", "remaining_time": "3:27:18", "throughput": 1269.93, "total_tokens": 625984} {"current_steps": 500, "total_steps": 12855, "loss": 0.9547, "accuracy": 0.6000000238418579, "learning_rate": 4.9813591737424596e-05, "epoch": 0.038895371450797356, "percentage": 3.89, "elapsed_time": "0:08:22", "remaining_time": "3:26:49", "throughput": 1274.05, "total_tokens": 639856} {"current_steps": 510, "total_steps": 12855, "loss": 0.9541, "accuracy": 1.0, "learning_rate": 4.9806070594873037e-05, "epoch": 0.039673278879813305, "percentage": 3.97, "elapsed_time": "0:08:31", "remaining_time": "3:26:28", "throughput": 1271.27, "total_tokens": 650656} {"current_steps": 520, "total_steps": 12855, "loss": 1.1046, "accuracy": 0.6000000238418579, "learning_rate": 4.979840129833474e-05, "epoch": 0.04045118630882925, "percentage": 4.05, "elapsed_time": "0:08:40", "remaining_time": "3:25:36", "throughput": 1272.02, "total_tokens": 661552} {"current_steps": 530, "total_steps": 12855, "loss": 1.043, "accuracy": 0.699999988079071, "learning_rate": 4.97905838936145e-05, "epoch": 0.041229093737845196, "percentage": 4.12, "elapsed_time": "0:08:48", "remaining_time": "3:24:56", "throughput": 1278.27, "total_tokens": 675936} {"current_steps": 540, "total_steps": 12855, "loss": 1.1117, "accuracy": 0.800000011920929, "learning_rate": 4.978261842740166e-05, "epoch": 0.042007001166861145, "percentage": 4.2, "elapsed_time": "0:08:58", "remaining_time": "3:24:37", "throughput": 1281.86, "total_tokens": 690112} {"current_steps": 550, "total_steps": 12855, "loss": 1.0439, "accuracy": 0.5, "learning_rate": 4.9774504947269905e-05, "epoch": 0.04278490859587709, "percentage": 4.28, "elapsed_time": "0:09:07", "remaining_time": "3:24:02", "throughput": 1287.41, "total_tokens": 704480} {"current_steps": 560, "total_steps": 12855, "loss": 0.8628, "accuracy": 0.8999999761581421, "learning_rate": 4.97662435016769e-05, "epoch": 0.043562816024893036, "percentage": 4.36, "elapsed_time": "0:09:16", "remaining_time": "3:23:47", "throughput": 1293.77, "total_tokens": 720512} {"current_steps": 570, "total_steps": 12855, "loss": 1.0203, "accuracy": 0.5, "learning_rate": 4.9757834139964035e-05, "epoch": 0.044340723453908985, "percentage": 4.43, "elapsed_time": "0:09:25", "remaining_time": "3:23:06", "throughput": 1294.27, "total_tokens": 731840} {"current_steps": 580, "total_steps": 12855, "loss": 0.9147, "accuracy": 0.699999988079071, "learning_rate": 4.974927691235614e-05, "epoch": 0.045118630882924934, "percentage": 4.51, "elapsed_time": "0:09:33", "remaining_time": "3:22:18", "throughput": 1295.08, "total_tokens": 742800} {"current_steps": 590, "total_steps": 12855, "loss": 1.293, "accuracy": 0.6000000238418579, "learning_rate": 4.9740571869961137e-05, "epoch": 0.045896538311940877, "percentage": 4.59, "elapsed_time": "0:09:42", "remaining_time": "3:21:41", "throughput": 1291.87, "total_tokens": 752016} {"current_steps": 600, "total_steps": 12855, "loss": 0.8797, "accuracy": 0.800000011920929, "learning_rate": 4.9731719064769833e-05, "epoch": 0.046674445740956826, "percentage": 4.67, "elapsed_time": "0:09:51", "remaining_time": "3:21:13", "throughput": 1291.4, "total_tokens": 763376} {"current_steps": 610, "total_steps": 12855, "loss": 0.9802, "accuracy": 0.800000011920929, "learning_rate": 4.972271854965549e-05, "epoch": 0.047452353169972775, "percentage": 4.75, "elapsed_time": "0:10:00", "remaining_time": "3:20:58", "throughput": 1290.83, "total_tokens": 775424} {"current_steps": 620, "total_steps": 12855, "loss": 1.0053, "accuracy": 0.699999988079071, "learning_rate": 4.9713570378373584e-05, "epoch": 0.048230260598988724, "percentage": 4.82, "elapsed_time": "0:10:14", "remaining_time": "3:22:10", "throughput": 1288.73, "total_tokens": 792192} {"current_steps": 630, "total_steps": 12855, "loss": 0.9485, "accuracy": 0.6000000238418579, "learning_rate": 4.9704274605561486e-05, "epoch": 0.049008168028004666, "percentage": 4.9, "elapsed_time": "0:10:25", "remaining_time": "3:22:08", "throughput": 1286.24, "total_tokens": 803920} {"current_steps": 640, "total_steps": 12855, "loss": 0.9619, "accuracy": 0.6000000238418579, "learning_rate": 4.969483128673808e-05, "epoch": 0.049786075457020615, "percentage": 4.98, "elapsed_time": "0:10:36", "remaining_time": "3:22:25", "throughput": 1285.25, "total_tokens": 817856} {"current_steps": 650, "total_steps": 12855, "loss": 1.1217, "accuracy": 0.6000000238418579, "learning_rate": 4.96852404783035e-05, "epoch": 0.050563982886036564, "percentage": 5.06, "elapsed_time": "0:10:48", "remaining_time": "3:22:49", "throughput": 1289.09, "total_tokens": 835488} {"current_steps": 660, "total_steps": 12855, "loss": 1.3282, "accuracy": 0.6000000238418579, "learning_rate": 4.967550223753873e-05, "epoch": 0.051341890315052506, "percentage": 5.13, "elapsed_time": "0:11:00", "remaining_time": "3:23:19", "throughput": 1290.9, "total_tokens": 852288} {"current_steps": 670, "total_steps": 12855, "loss": 0.9846, "accuracy": 0.699999988079071, "learning_rate": 4.966561662260532e-05, "epoch": 0.052119797744068455, "percentage": 5.21, "elapsed_time": "0:11:07", "remaining_time": "3:22:23", "throughput": 1290.91, "total_tokens": 861984} {"current_steps": 680, "total_steps": 12855, "loss": 0.9382, "accuracy": 0.800000011920929, "learning_rate": 4.9655583692544986e-05, "epoch": 0.052897705173084404, "percentage": 5.29, "elapsed_time": "0:11:18", "remaining_time": "3:22:21", "throughput": 1291.01, "total_tokens": 875440} {"current_steps": 690, "total_steps": 12855, "loss": 1.1782, "accuracy": 0.8999999761581421, "learning_rate": 4.96454035072793e-05, "epoch": 0.05367561260210035, "percentage": 5.37, "elapsed_time": "0:11:28", "remaining_time": "3:22:12", "throughput": 1294.63, "total_tokens": 890912} {"current_steps": 700, "total_steps": 12855, "loss": 1.1765, "accuracy": 0.800000011920929, "learning_rate": 4.963507612760932e-05, "epoch": 0.054453520031116295, "percentage": 5.45, "elapsed_time": "0:11:38", "remaining_time": "3:22:00", "throughput": 1298.62, "total_tokens": 906464} {"current_steps": 710, "total_steps": 12855, "loss": 1.659, "accuracy": 0.6000000238418579, "learning_rate": 4.962460161521518e-05, "epoch": 0.055231427460132244, "percentage": 5.52, "elapsed_time": "0:11:46", "remaining_time": "3:21:32", "throughput": 1300.91, "total_tokens": 919648} {"current_steps": 720, "total_steps": 12855, "loss": 0.9826, "accuracy": 0.4000000059604645, "learning_rate": 4.961398003265582e-05, "epoch": 0.056009334889148193, "percentage": 5.6, "elapsed_time": "0:11:55", "remaining_time": "3:21:06", "throughput": 1302.01, "total_tokens": 932144} {"current_steps": 730, "total_steps": 12855, "loss": 1.1655, "accuracy": 0.6000000238418579, "learning_rate": 4.96032114433685e-05, "epoch": 0.056787242318164136, "percentage": 5.68, "elapsed_time": "0:12:04", "remaining_time": "3:20:28", "throughput": 1304.07, "total_tokens": 944384} {"current_steps": 740, "total_steps": 12855, "loss": 0.9084, "accuracy": 0.800000011920929, "learning_rate": 4.9592295911668516e-05, "epoch": 0.057565149747180085, "percentage": 5.76, "elapsed_time": "0:12:13", "remaining_time": "3:20:01", "throughput": 1304.82, "total_tokens": 956528} {"current_steps": 750, "total_steps": 12855, "loss": 0.8905, "accuracy": 0.5, "learning_rate": 4.958123350274878e-05, "epoch": 0.058343057176196034, "percentage": 5.83, "elapsed_time": "0:12:23", "remaining_time": "3:20:08", "throughput": 1307.9, "total_tokens": 973072} {"current_steps": 760, "total_steps": 12855, "loss": 1.0587, "accuracy": 0.699999988079071, "learning_rate": 4.957002428267937e-05, "epoch": 0.05912096460521198, "percentage": 5.91, "elapsed_time": "0:12:34", "remaining_time": "3:20:09", "throughput": 1312.44, "total_tokens": 990416} {"current_steps": 770, "total_steps": 12855, "loss": 0.8686, "accuracy": 0.699999988079071, "learning_rate": 4.9558668318407264e-05, "epoch": 0.059898872034227925, "percentage": 5.99, "elapsed_time": "0:12:42", "remaining_time": "3:19:30", "throughput": 1312.14, "total_tokens": 1000784} {"current_steps": 780, "total_steps": 12855, "loss": 1.0232, "accuracy": 0.6000000238418579, "learning_rate": 4.954716567775582e-05, "epoch": 0.060676779463243874, "percentage": 6.07, "elapsed_time": "0:12:55", "remaining_time": "3:20:11", "throughput": 1310.78, "total_tokens": 1016992} {"current_steps": 790, "total_steps": 12855, "loss": 0.8984, "accuracy": 0.8999999761581421, "learning_rate": 4.9535516429424444e-05, "epoch": 0.06145468689225982, "percentage": 6.15, "elapsed_time": "0:13:03", "remaining_time": "3:19:25", "throughput": 1310.91, "total_tokens": 1027120} {"current_steps": 800, "total_steps": 12855, "loss": 1.0546, "accuracy": 0.4000000059604645, "learning_rate": 4.952372064298813e-05, "epoch": 0.062232594321275765, "percentage": 6.22, "elapsed_time": "0:13:12", "remaining_time": "3:19:01", "throughput": 1312.59, "total_tokens": 1040192} {"current_steps": 810, "total_steps": 12855, "loss": 0.9553, "accuracy": 0.5, "learning_rate": 4.9511778388897094e-05, "epoch": 0.06301050175029171, "percentage": 6.3, "elapsed_time": "0:13:22", "remaining_time": "3:18:49", "throughput": 1314.04, "total_tokens": 1054160} {"current_steps": 820, "total_steps": 12855, "loss": 1.124, "accuracy": 0.699999988079071, "learning_rate": 4.949968973847632e-05, "epoch": 0.06378840917930766, "percentage": 6.38, "elapsed_time": "0:13:31", "remaining_time": "3:18:32", "throughput": 1315.31, "total_tokens": 1067616} {"current_steps": 830, "total_steps": 12855, "loss": 0.9705, "accuracy": 0.699999988079071, "learning_rate": 4.9487454763925135e-05, "epoch": 0.06456631660832361, "percentage": 6.46, "elapsed_time": "0:13:44", "remaining_time": "3:19:06", "throughput": 1314.42, "total_tokens": 1083808} {"current_steps": 840, "total_steps": 12855, "loss": 1.2595, "accuracy": 0.800000011920929, "learning_rate": 4.94750735383168e-05, "epoch": 0.06534422403733955, "percentage": 6.53, "elapsed_time": "0:13:53", "remaining_time": "3:18:44", "throughput": 1314.18, "total_tokens": 1095568} {"current_steps": 850, "total_steps": 12855, "loss": 0.8426, "accuracy": 0.800000011920929, "learning_rate": 4.946254613559803e-05, "epoch": 0.06612213146635551, "percentage": 6.61, "elapsed_time": "0:14:03", "remaining_time": "3:18:33", "throughput": 1317.01, "total_tokens": 1110960} {"current_steps": 860, "total_steps": 12855, "loss": 1.0273, "accuracy": 0.699999988079071, "learning_rate": 4.944987263058863e-05, "epoch": 0.06690003889537145, "percentage": 6.69, "elapsed_time": "0:14:11", "remaining_time": "3:17:51", "throughput": 1317.69, "total_tokens": 1121584} {"current_steps": 870, "total_steps": 12855, "loss": 1.1889, "accuracy": 0.6000000238418579, "learning_rate": 4.9437053098980956e-05, "epoch": 0.0676779463243874, "percentage": 6.77, "elapsed_time": "0:14:21", "remaining_time": "3:17:46", "throughput": 1320.27, "total_tokens": 1137296} {"current_steps": 880, "total_steps": 12855, "loss": 1.1801, "accuracy": 0.800000011920929, "learning_rate": 4.942408761733952e-05, "epoch": 0.06845585375340335, "percentage": 6.85, "elapsed_time": "0:14:31", "remaining_time": "3:17:43", "throughput": 1322.41, "total_tokens": 1152848} {"current_steps": 890, "total_steps": 12855, "loss": 0.9443, "accuracy": 0.800000011920929, "learning_rate": 4.9410976263100515e-05, "epoch": 0.06923376118241929, "percentage": 6.92, "elapsed_time": "0:14:40", "remaining_time": "3:17:11", "throughput": 1322.68, "total_tokens": 1164000} {"current_steps": 900, "total_steps": 12855, "loss": 1.0886, "accuracy": 0.6000000238418579, "learning_rate": 4.9397719114571386e-05, "epoch": 0.07001166861143523, "percentage": 7.0, "elapsed_time": "0:14:48", "remaining_time": "3:16:37", "throughput": 1322.54, "total_tokens": 1174592} {"current_steps": 910, "total_steps": 12855, "loss": 1.0652, "accuracy": 0.6000000238418579, "learning_rate": 4.9384316250930276e-05, "epoch": 0.07078957604045119, "percentage": 7.08, "elapsed_time": "0:14:56", "remaining_time": "3:16:07", "throughput": 1324.13, "total_tokens": 1187040} {"current_steps": 920, "total_steps": 12855, "loss": 0.9786, "accuracy": 0.800000011920929, "learning_rate": 4.937076775222566e-05, "epoch": 0.07156748346946713, "percentage": 7.16, "elapsed_time": "0:15:03", "remaining_time": "3:15:26", "throughput": 1322.58, "total_tokens": 1195472} {"current_steps": 930, "total_steps": 12855, "loss": 0.8377, "accuracy": 0.800000011920929, "learning_rate": 4.93570736993758e-05, "epoch": 0.07234539089848308, "percentage": 7.23, "elapsed_time": "0:15:12", "remaining_time": "3:15:06", "throughput": 1323.27, "total_tokens": 1208128} {"current_steps": 940, "total_steps": 12855, "loss": 0.9847, "accuracy": 0.699999988079071, "learning_rate": 4.934323417416827e-05, "epoch": 0.07312329832749903, "percentage": 7.31, "elapsed_time": "0:15:21", "remaining_time": "3:14:40", "throughput": 1320.69, "total_tokens": 1216976} {"current_steps": 950, "total_steps": 12855, "loss": 1.0711, "accuracy": 0.6000000238418579, "learning_rate": 4.932924925925949e-05, "epoch": 0.07390120575651497, "percentage": 7.39, "elapsed_time": "0:15:33", "remaining_time": "3:15:00", "throughput": 1318.08, "total_tokens": 1230656} {"current_steps": 960, "total_steps": 12855, "loss": 0.9308, "accuracy": 0.6000000238418579, "learning_rate": 4.9315119038174206e-05, "epoch": 0.07467911318553092, "percentage": 7.47, "elapsed_time": "0:15:42", "remaining_time": "3:14:40", "throughput": 1320.72, "total_tokens": 1245024} {"current_steps": 970, "total_steps": 12855, "loss": 1.0159, "accuracy": 1.0, "learning_rate": 4.930084359530502e-05, "epoch": 0.07545702061454687, "percentage": 7.55, "elapsed_time": "0:15:52", "remaining_time": "3:14:32", "throughput": 1323.07, "total_tokens": 1260400} {"current_steps": 980, "total_steps": 12855, "loss": 1.0535, "accuracy": 0.6000000238418579, "learning_rate": 4.9286423015911845e-05, "epoch": 0.07623492804356281, "percentage": 7.62, "elapsed_time": "0:16:00", "remaining_time": "3:14:02", "throughput": 1323.96, "total_tokens": 1272128} {"current_steps": 990, "total_steps": 12855, "loss": 0.8751, "accuracy": 0.8999999761581421, "learning_rate": 4.927185738612145e-05, "epoch": 0.07701283547257877, "percentage": 7.7, "elapsed_time": "0:16:10", "remaining_time": "3:13:45", "throughput": 1325.34, "total_tokens": 1285616} {"current_steps": 1000, "total_steps": 12855, "loss": 1.0701, "accuracy": 0.5, "learning_rate": 4.925714679292689e-05, "epoch": 0.07779074290159471, "percentage": 7.78, "elapsed_time": "0:17:23", "remaining_time": "3:26:09", "throughput": 1249.91, "total_tokens": 1304160} {"current_steps": 1010, "total_steps": 12855, "loss": 0.9235, "accuracy": 0.8999999761581421, "learning_rate": 4.9242291324187024e-05, "epoch": 0.07856865033061065, "percentage": 7.86, "elapsed_time": "0:18:05", "remaining_time": "3:32:12", "throughput": 1213.66, "total_tokens": 1317664} {"current_steps": 1020, "total_steps": 12855, "loss": 1.1205, "accuracy": 0.800000011920929, "learning_rate": 4.9227291068625983e-05, "epoch": 0.07934655775962661, "percentage": 7.93, "elapsed_time": "0:18:33", "remaining_time": "3:35:14", "throughput": 1199.68, "total_tokens": 1335264} {"current_steps": 1030, "total_steps": 12855, "loss": 0.9276, "accuracy": 0.6000000238418579, "learning_rate": 4.921214611583262e-05, "epoch": 0.08012446518864255, "percentage": 8.01, "elapsed_time": "0:18:59", "remaining_time": "3:37:58", "throughput": 1185.46, "total_tokens": 1350464} {"current_steps": 1040, "total_steps": 12855, "loss": 0.9785, "accuracy": 0.4000000059604645, "learning_rate": 4.9196856556260004e-05, "epoch": 0.0809023726176585, "percentage": 8.09, "elapsed_time": "0:19:32", "remaining_time": "3:41:55", "throughput": 1167.27, "total_tokens": 1368112} {"current_steps": 1050, "total_steps": 12855, "loss": 0.8723, "accuracy": 0.8999999761581421, "learning_rate": 4.918142248122488e-05, "epoch": 0.08168028004667445, "percentage": 8.17, "elapsed_time": "0:19:49", "remaining_time": "3:42:49", "throughput": 1161.19, "total_tokens": 1380816} {"current_steps": 1060, "total_steps": 12855, "loss": 1.0289, "accuracy": 0.8999999761581421, "learning_rate": 4.916584398290707e-05, "epoch": 0.08245818747569039, "percentage": 8.25, "elapsed_time": "0:20:10", "remaining_time": "3:44:27", "throughput": 1152.07, "total_tokens": 1394336} {"current_steps": 1070, "total_steps": 12855, "loss": 0.8746, "accuracy": 0.8999999761581421, "learning_rate": 4.915012115434899e-05, "epoch": 0.08323609490470633, "percentage": 8.32, "elapsed_time": "0:20:32", "remaining_time": "3:46:19", "throughput": 1142.19, "total_tokens": 1408224} {"current_steps": 1080, "total_steps": 12855, "loss": 1.15, "accuracy": 0.699999988079071, "learning_rate": 4.913425408945508e-05, "epoch": 0.08401400233372229, "percentage": 8.4, "elapsed_time": "0:20:48", "remaining_time": "3:46:48", "throughput": 1136.26, "total_tokens": 1418224} {"current_steps": 1090, "total_steps": 12855, "loss": 1.2581, "accuracy": 0.5, "learning_rate": 4.911824288299119e-05, "epoch": 0.08479190976273823, "percentage": 8.48, "elapsed_time": "0:21:06", "remaining_time": "3:47:52", "throughput": 1129.66, "total_tokens": 1430928} {"current_steps": 1100, "total_steps": 12855, "loss": 0.878, "accuracy": 0.5, "learning_rate": 4.9102087630584096e-05, "epoch": 0.08556981719175417, "percentage": 8.56, "elapsed_time": "0:21:18", "remaining_time": "3:47:45", "throughput": 1126.75, "total_tokens": 1440912} {"current_steps": 1110, "total_steps": 12855, "loss": 1.06, "accuracy": 0.6000000238418579, "learning_rate": 4.9085788428720845e-05, "epoch": 0.08634772462077013, "percentage": 8.63, "elapsed_time": "0:21:34", "remaining_time": "3:48:17", "throughput": 1120.87, "total_tokens": 1450960} {"current_steps": 1120, "total_steps": 12855, "loss": 0.7924, "accuracy": 0.699999988079071, "learning_rate": 4.9069345374748265e-05, "epoch": 0.08712563204978607, "percentage": 8.71, "elapsed_time": "0:21:54", "remaining_time": "3:49:27", "throughput": 1113.56, "total_tokens": 1463232} {"current_steps": 1130, "total_steps": 12855, "loss": 1.0578, "accuracy": 0.6000000238418579, "learning_rate": 4.9052758566872305e-05, "epoch": 0.08790353947880203, "percentage": 8.79, "elapsed_time": "0:22:18", "remaining_time": "3:51:32", "throughput": 1104.34, "total_tokens": 1478576} {"current_steps": 1140, "total_steps": 12855, "loss": 1.0967, "accuracy": 0.699999988079071, "learning_rate": 4.903602810415749e-05, "epoch": 0.08868144690781797, "percentage": 8.87, "elapsed_time": "0:22:35", "remaining_time": "3:52:05", "throughput": 1099.3, "total_tokens": 1489696} {"current_steps": 1150, "total_steps": 12855, "loss": 0.8442, "accuracy": 0.800000011920929, "learning_rate": 4.901915408652635e-05, "epoch": 0.08945935433683391, "percentage": 8.95, "elapsed_time": "0:23:00", "remaining_time": "3:54:08", "throughput": 1089.1, "total_tokens": 1503280} {"current_steps": 1160, "total_steps": 12855, "loss": 1.0602, "accuracy": 0.800000011920929, "learning_rate": 4.900213661475874e-05, "epoch": 0.09023726176584987, "percentage": 9.02, "elapsed_time": "0:23:23", "remaining_time": "3:55:48", "throughput": 1082.01, "total_tokens": 1518464} {"current_steps": 1170, "total_steps": 12855, "loss": 1.1269, "accuracy": 0.4000000059604645, "learning_rate": 4.898497579049135e-05, "epoch": 0.09101516919486581, "percentage": 9.1, "elapsed_time": "0:23:46", "remaining_time": "3:57:30", "throughput": 1075.11, "total_tokens": 1534032} {"current_steps": 1180, "total_steps": 12855, "loss": 0.8111, "accuracy": 0.8999999761581421, "learning_rate": 4.8967671716217e-05, "epoch": 0.09179307662388175, "percentage": 9.18, "elapsed_time": "0:24:18", "remaining_time": "4:00:34", "throughput": 1062.24, "total_tokens": 1549760} {"current_steps": 1190, "total_steps": 12855, "loss": 1.0743, "accuracy": 0.699999988079071, "learning_rate": 4.8950224495284095e-05, "epoch": 0.09257098405289771, "percentage": 9.26, "elapsed_time": "0:24:55", "remaining_time": "4:04:21", "throughput": 1048.39, "total_tokens": 1568048} {"current_steps": 1200, "total_steps": 12855, "loss": 1.0317, "accuracy": 0.800000011920929, "learning_rate": 4.893263423189597e-05, "epoch": 0.09334889148191365, "percentage": 9.33, "elapsed_time": "0:25:13", "remaining_time": "4:04:56", "throughput": 1044.71, "total_tokens": 1580768} {"current_steps": 1210, "total_steps": 12855, "loss": 0.9136, "accuracy": 0.699999988079071, "learning_rate": 4.891490103111027e-05, "epoch": 0.0941267989109296, "percentage": 9.41, "elapsed_time": "0:25:26", "remaining_time": "4:04:53", "throughput": 1043.04, "total_tokens": 1592448} {"current_steps": 1220, "total_steps": 12855, "loss": 0.9607, "accuracy": 0.8999999761581421, "learning_rate": 4.8897024998838363e-05, "epoch": 0.09490470633994555, "percentage": 9.49, "elapsed_time": "0:25:41", "remaining_time": "4:05:04", "throughput": 1041.19, "total_tokens": 1605392} {"current_steps": 1230, "total_steps": 12855, "loss": 0.8907, "accuracy": 0.800000011920929, "learning_rate": 4.887900624184465e-05, "epoch": 0.09568261376896149, "percentage": 9.57, "elapsed_time": "0:26:00", "remaining_time": "4:05:50", "throughput": 1037.78, "total_tokens": 1619680} {"current_steps": 1240, "total_steps": 12855, "loss": 0.9652, "accuracy": 0.8999999761581421, "learning_rate": 4.886084486774596e-05, "epoch": 0.09646052119797745, "percentage": 9.65, "elapsed_time": "0:26:20", "remaining_time": "4:06:44", "throughput": 1034.74, "total_tokens": 1635408} {"current_steps": 1250, "total_steps": 12855, "loss": 0.8558, "accuracy": 0.800000011920929, "learning_rate": 4.8842540985010896e-05, "epoch": 0.09723842862699339, "percentage": 9.72, "elapsed_time": "0:26:37", "remaining_time": "4:07:14", "throughput": 1032.73, "total_tokens": 1650128} {"current_steps": 1260, "total_steps": 12855, "loss": 1.0799, "accuracy": 0.699999988079071, "learning_rate": 4.882409470295921e-05, "epoch": 0.09801633605600933, "percentage": 9.8, "elapsed_time": "0:27:03", "remaining_time": "4:08:59", "throughput": 1022.75, "total_tokens": 1660384} {"current_steps": 1270, "total_steps": 12855, "loss": 1.1986, "accuracy": 1.0, "learning_rate": 4.880550613176111e-05, "epoch": 0.09879424348502529, "percentage": 9.88, "elapsed_time": "0:27:34", "remaining_time": "4:11:35", "throughput": 1014.63, "total_tokens": 1679104} {"current_steps": 1280, "total_steps": 12855, "loss": 1.0842, "accuracy": 0.800000011920929, "learning_rate": 4.8786775382436646e-05, "epoch": 0.09957215091404123, "percentage": 9.96, "elapsed_time": "0:28:08", "remaining_time": "4:14:26", "throughput": 1003.73, "total_tokens": 1694560} {"current_steps": 1290, "total_steps": 12855, "loss": 0.8518, "accuracy": 0.699999988079071, "learning_rate": 4.8767902566855004e-05, "epoch": 0.10035005834305717, "percentage": 10.04, "elapsed_time": "0:28:40", "remaining_time": "4:17:05", "throughput": 992.83, "total_tokens": 1708288} {"current_steps": 1300, "total_steps": 12855, "loss": 0.9644, "accuracy": 0.800000011920929, "learning_rate": 4.874888779773388e-05, "epoch": 0.10112796577207313, "percentage": 10.11, "elapsed_time": "0:29:01", "remaining_time": "4:17:56", "throughput": 989.57, "total_tokens": 1723024} {"current_steps": 1310, "total_steps": 12855, "loss": 0.8717, "accuracy": 0.8999999761581421, "learning_rate": 4.872973118863877e-05, "epoch": 0.10190587320108907, "percentage": 10.19, "elapsed_time": "0:29:13", "remaining_time": "4:17:31", "throughput": 987.73, "total_tokens": 1731728} {"current_steps": 1320, "total_steps": 12855, "loss": 0.9145, "accuracy": 0.8999999761581421, "learning_rate": 4.871043285398231e-05, "epoch": 0.10268378063010501, "percentage": 10.27, "elapsed_time": "0:29:27", "remaining_time": "4:17:26", "throughput": 986.37, "total_tokens": 1743568} {"current_steps": 1330, "total_steps": 12855, "loss": 0.954, "accuracy": 0.8999999761581421, "learning_rate": 4.8690992909023606e-05, "epoch": 0.10346168805912097, "percentage": 10.35, "elapsed_time": "0:29:40", "remaining_time": "4:17:12", "throughput": 986.15, "total_tokens": 1756272} {"current_steps": 1340, "total_steps": 12855, "loss": 0.8471, "accuracy": 0.800000011920929, "learning_rate": 4.86714114698675e-05, "epoch": 0.10423959548813691, "percentage": 10.42, "elapsed_time": "0:30:00", "remaining_time": "4:17:47", "throughput": 982.96, "total_tokens": 1769328} {"current_steps": 1350, "total_steps": 12855, "loss": 0.9921, "accuracy": 0.6000000238418579, "learning_rate": 4.865168865346393e-05, "epoch": 0.10501750291715285, "percentage": 10.5, "elapsed_time": "0:30:20", "remaining_time": "4:18:38", "throughput": 979.47, "total_tokens": 1783504} {"current_steps": 1360, "total_steps": 12855, "loss": 1.0608, "accuracy": 0.699999988079071, "learning_rate": 4.863182457760722e-05, "epoch": 0.10579541034616881, "percentage": 10.58, "elapsed_time": "0:31:00", "remaining_time": "4:22:04", "throughput": 969.95, "total_tokens": 1804496} {"current_steps": 1370, "total_steps": 12855, "loss": 0.9693, "accuracy": 0.5, "learning_rate": 4.861181936093533e-05, "epoch": 0.10657331777518475, "percentage": 10.66, "elapsed_time": "0:31:17", "remaining_time": "4:22:21", "throughput": 967.69, "total_tokens": 1817024} {"current_steps": 1380, "total_steps": 12855, "loss": 1.1456, "accuracy": 0.6000000238418579, "learning_rate": 4.859167312292919e-05, "epoch": 0.1073512252042007, "percentage": 10.74, "elapsed_time": "0:31:26", "remaining_time": "4:21:28", "throughput": 967.3, "total_tokens": 1824992} {"current_steps": 1390, "total_steps": 12855, "loss": 0.9373, "accuracy": 0.699999988079071, "learning_rate": 4.857138598391201e-05, "epoch": 0.10812913263321665, "percentage": 10.81, "elapsed_time": "0:31:42", "remaining_time": "4:21:33", "throughput": 965.29, "total_tokens": 1836608} {"current_steps": 1400, "total_steps": 12855, "loss": 0.9069, "accuracy": 0.800000011920929, "learning_rate": 4.855095806504849e-05, "epoch": 0.10890704006223259, "percentage": 10.89, "elapsed_time": "0:32:00", "remaining_time": "4:21:53", "throughput": 963.65, "total_tokens": 1850608} {"current_steps": 1410, "total_steps": 12855, "loss": 1.3462, "accuracy": 0.5, "learning_rate": 4.8530389488344176e-05, "epoch": 0.10968494749124855, "percentage": 10.97, "elapsed_time": "0:32:19", "remaining_time": "4:22:20", "throughput": 960.81, "total_tokens": 1863232} {"current_steps": 1420, "total_steps": 12855, "loss": 0.8495, "accuracy": 1.0, "learning_rate": 4.850968037664463e-05, "epoch": 0.11046285492026449, "percentage": 11.05, "elapsed_time": "0:32:35", "remaining_time": "4:22:28", "throughput": 958.51, "total_tokens": 1874480} {"current_steps": 1430, "total_steps": 12855, "loss": 0.9673, "accuracy": 0.6000000238418579, "learning_rate": 4.8488830853634835e-05, "epoch": 0.11124076234928043, "percentage": 11.12, "elapsed_time": "0:32:47", "remaining_time": "4:22:01", "throughput": 957.82, "total_tokens": 1884768} {"current_steps": 1440, "total_steps": 12855, "loss": 1.0608, "accuracy": 0.800000011920929, "learning_rate": 4.8467841043838315e-05, "epoch": 0.11201866977829639, "percentage": 11.2, "elapsed_time": "0:33:02", "remaining_time": "4:21:52", "throughput": 957.15, "total_tokens": 1897216} {"current_steps": 1450, "total_steps": 12855, "loss": 1.1853, "accuracy": 0.8999999761581421, "learning_rate": 4.844671107261649e-05, "epoch": 0.11279657720731233, "percentage": 11.28, "elapsed_time": "0:33:16", "remaining_time": "4:21:46", "throughput": 955.68, "total_tokens": 1908384} {"current_steps": 1460, "total_steps": 12855, "loss": 1.0162, "accuracy": 0.6000000238418579, "learning_rate": 4.842544106616789e-05, "epoch": 0.11357448463632827, "percentage": 11.36, "elapsed_time": "0:33:41", "remaining_time": "4:22:57", "throughput": 951.55, "total_tokens": 1923600} {"current_steps": 1470, "total_steps": 12855, "loss": 0.9941, "accuracy": 0.8999999761581421, "learning_rate": 4.8404031151527375e-05, "epoch": 0.11435239206534423, "percentage": 11.44, "elapsed_time": "0:34:15", "remaining_time": "4:25:20", "throughput": 943.55, "total_tokens": 1939600} {"current_steps": 1480, "total_steps": 12855, "loss": 1.0903, "accuracy": 0.699999988079071, "learning_rate": 4.838248145656545e-05, "epoch": 0.11513029949436017, "percentage": 11.51, "elapsed_time": "0:34:28", "remaining_time": "4:24:56", "throughput": 943.23, "total_tokens": 1950864} {"current_steps": 1490, "total_steps": 12855, "loss": 1.2121, "accuracy": 0.699999988079071, "learning_rate": 4.836079210998743e-05, "epoch": 0.11590820692337611, "percentage": 11.59, "elapsed_time": "0:34:44", "remaining_time": "4:24:59", "throughput": 940.72, "total_tokens": 1960960} {"current_steps": 1500, "total_steps": 12855, "loss": 0.661, "accuracy": 0.699999988079071, "learning_rate": 4.833896324133269e-05, "epoch": 0.11668611435239207, "percentage": 11.67, "elapsed_time": "0:35:04", "remaining_time": "4:25:28", "throughput": 938.29, "total_tokens": 1974304} {"current_steps": 1510, "total_steps": 12855, "loss": 0.9237, "accuracy": 0.699999988079071, "learning_rate": 4.8316994980973924e-05, "epoch": 0.11746402178140801, "percentage": 11.75, "elapsed_time": "0:35:22", "remaining_time": "4:25:46", "throughput": 936.46, "total_tokens": 1987552} {"current_steps": 1520, "total_steps": 12855, "loss": 0.9495, "accuracy": 0.699999988079071, "learning_rate": 4.8294887460116315e-05, "epoch": 0.11824192921042397, "percentage": 11.82, "elapsed_time": "0:35:48", "remaining_time": "4:27:01", "throughput": 932.77, "total_tokens": 2004064} {"current_steps": 1530, "total_steps": 12855, "loss": 1.0902, "accuracy": 0.800000011920929, "learning_rate": 4.82726408107968e-05, "epoch": 0.11901983663943991, "percentage": 11.9, "elapsed_time": "0:36:07", "remaining_time": "4:27:23", "throughput": 930.49, "total_tokens": 2016864} {"current_steps": 1540, "total_steps": 12855, "loss": 1.2516, "accuracy": 0.699999988079071, "learning_rate": 4.825025516588325e-05, "epoch": 0.11979774406845585, "percentage": 11.98, "elapsed_time": "0:36:37", "remaining_time": "4:29:06", "throughput": 925.81, "total_tokens": 2034576} {"current_steps": 1550, "total_steps": 12855, "loss": 0.9078, "accuracy": 1.0, "learning_rate": 4.822773065907368e-05, "epoch": 0.1205756514974718, "percentage": 12.06, "elapsed_time": "0:37:00", "remaining_time": "4:29:53", "throughput": 922.79, "total_tokens": 2048816} {"current_steps": 1560, "total_steps": 12855, "loss": 1.0768, "accuracy": 0.6000000238418579, "learning_rate": 4.8205067424895464e-05, "epoch": 0.12135355892648775, "percentage": 12.14, "elapsed_time": "0:37:12", "remaining_time": "4:29:27", "throughput": 922.32, "total_tokens": 2059440} {"current_steps": 1570, "total_steps": 12855, "loss": 1.1554, "accuracy": 0.699999988079071, "learning_rate": 4.8182265598704536e-05, "epoch": 0.12213146635550369, "percentage": 12.21, "elapsed_time": "0:37:42", "remaining_time": "4:31:05", "throughput": 917.72, "total_tokens": 2076736} {"current_steps": 1580, "total_steps": 12855, "loss": 0.7018, "accuracy": 1.0, "learning_rate": 4.8159325316684524e-05, "epoch": 0.12290937378451965, "percentage": 12.29, "elapsed_time": "0:37:55", "remaining_time": "4:30:35", "throughput": 917.58, "total_tokens": 2087664} {"current_steps": 1590, "total_steps": 12855, "loss": 0.8094, "accuracy": 1.0, "learning_rate": 4.813624671584604e-05, "epoch": 0.12368728121353559, "percentage": 12.37, "elapsed_time": "0:38:16", "remaining_time": "4:31:07", "throughput": 915.41, "total_tokens": 2101888} {"current_steps": 1600, "total_steps": 12855, "loss": 0.9019, "accuracy": 0.8999999761581421, "learning_rate": 4.811302993402576e-05, "epoch": 0.12446518864255153, "percentage": 12.45, "elapsed_time": "0:38:29", "remaining_time": "4:30:48", "throughput": 915.13, "total_tokens": 2113792} {"current_steps": 1610, "total_steps": 12855, "loss": 0.8562, "accuracy": 0.800000011920929, "learning_rate": 4.808967510988567e-05, "epoch": 0.12524309607156747, "percentage": 12.52, "elapsed_time": "0:38:47", "remaining_time": "4:30:55", "throughput": 914.43, "total_tokens": 2128176} {"current_steps": 1620, "total_steps": 12855, "loss": 1.0377, "accuracy": 0.699999988079071, "learning_rate": 4.806618238291221e-05, "epoch": 0.12602100350058343, "percentage": 12.6, "elapsed_time": "0:38:58", "remaining_time": "4:30:19", "throughput": 914.08, "total_tokens": 2137808} {"current_steps": 1630, "total_steps": 12855, "loss": 0.9564, "accuracy": 0.8999999761581421, "learning_rate": 4.8042551893415413e-05, "epoch": 0.12679891092959938, "percentage": 12.68, "elapsed_time": "0:39:14", "remaining_time": "4:30:11", "throughput": 913.06, "total_tokens": 2149376} {"current_steps": 1640, "total_steps": 12855, "loss": 0.9976, "accuracy": 0.8999999761581421, "learning_rate": 4.801878378252814e-05, "epoch": 0.1275768183586153, "percentage": 12.76, "elapsed_time": "0:39:31", "remaining_time": "4:30:14", "throughput": 911.97, "total_tokens": 2162304} {"current_steps": 1650, "total_steps": 12855, "loss": 0.9256, "accuracy": 0.8999999761581421, "learning_rate": 4.799487819220516e-05, "epoch": 0.12835472578763127, "percentage": 12.84, "elapsed_time": "0:39:46", "remaining_time": "4:30:04", "throughput": 911.45, "total_tokens": 2174896} {"current_steps": 1660, "total_steps": 12855, "loss": 0.8614, "accuracy": 0.699999988079071, "learning_rate": 4.7970835265222374e-05, "epoch": 0.12913263321664722, "percentage": 12.91, "elapsed_time": "0:40:05", "remaining_time": "4:30:22", "throughput": 910.06, "total_tokens": 2189168} {"current_steps": 1670, "total_steps": 12855, "loss": 0.7921, "accuracy": 0.8999999761581421, "learning_rate": 4.794665514517588e-05, "epoch": 0.12991054064566315, "percentage": 12.99, "elapsed_time": "0:40:19", "remaining_time": "4:30:02", "throughput": 909.44, "total_tokens": 2200080} {"current_steps": 1680, "total_steps": 12855, "loss": 0.9724, "accuracy": 0.6000000238418579, "learning_rate": 4.792233797648119e-05, "epoch": 0.1306884480746791, "percentage": 13.07, "elapsed_time": "0:40:30", "remaining_time": "4:29:24", "throughput": 909.57, "total_tokens": 2210304} {"current_steps": 1690, "total_steps": 12855, "loss": 0.9342, "accuracy": 0.699999988079071, "learning_rate": 4.789788390437233e-05, "epoch": 0.13146635550369506, "percentage": 13.15, "elapsed_time": "0:40:45", "remaining_time": "4:29:16", "throughput": 908.96, "total_tokens": 2222928} {"current_steps": 1700, "total_steps": 12855, "loss": 1.0041, "accuracy": 0.800000011920929, "learning_rate": 4.7873293074900984e-05, "epoch": 0.13224426293271102, "percentage": 13.22, "elapsed_time": "0:41:00", "remaining_time": "4:29:07", "throughput": 908.64, "total_tokens": 2235984} {"current_steps": 1710, "total_steps": 12855, "loss": 1.0628, "accuracy": 0.5, "learning_rate": 4.7848565634935605e-05, "epoch": 0.13302217036172695, "percentage": 13.3, "elapsed_time": "0:41:12", "remaining_time": "4:28:37", "throughput": 907.92, "total_tokens": 2245280} {"current_steps": 1720, "total_steps": 12855, "loss": 0.9457, "accuracy": 0.699999988079071, "learning_rate": 4.782370173216056e-05, "epoch": 0.1338000777907429, "percentage": 13.38, "elapsed_time": "0:41:30", "remaining_time": "4:28:44", "throughput": 907.26, "total_tokens": 2259712} {"current_steps": 1730, "total_steps": 12855, "loss": 1.0156, "accuracy": 0.800000011920929, "learning_rate": 4.7798701515075236e-05, "epoch": 0.13457798521975886, "percentage": 13.46, "elapsed_time": "0:41:52", "remaining_time": "4:29:17", "throughput": 905.56, "total_tokens": 2275328} {"current_steps": 1740, "total_steps": 12855, "loss": 1.2947, "accuracy": 0.6000000238418579, "learning_rate": 4.777356513299317e-05, "epoch": 0.1353558926487748, "percentage": 13.54, "elapsed_time": "0:42:05", "remaining_time": "4:28:49", "throughput": 904.96, "total_tokens": 2285040} {"current_steps": 1750, "total_steps": 12855, "loss": 1.0739, "accuracy": 0.5, "learning_rate": 4.7748292736041114e-05, "epoch": 0.13613380007779075, "percentage": 13.61, "elapsed_time": "0:42:21", "remaining_time": "4:28:44", "throughput": 903.94, "total_tokens": 2296960} {"current_steps": 1760, "total_steps": 12855, "loss": 0.811, "accuracy": 0.800000011920929, "learning_rate": 4.77228844751582e-05, "epoch": 0.1369117075068067, "percentage": 13.69, "elapsed_time": "0:42:34", "remaining_time": "4:28:23", "throughput": 903.33, "total_tokens": 2307584} {"current_steps": 1770, "total_steps": 12855, "loss": 1.0189, "accuracy": 0.800000011920929, "learning_rate": 4.769734050209498e-05, "epoch": 0.13768961493582263, "percentage": 13.77, "elapsed_time": "0:42:57", "remaining_time": "4:29:00", "throughput": 901.19, "total_tokens": 2322576} {"current_steps": 1780, "total_steps": 12855, "loss": 0.9899, "accuracy": 0.800000011920929, "learning_rate": 4.7671660969412556e-05, "epoch": 0.13846752236483859, "percentage": 13.85, "elapsed_time": "0:43:08", "remaining_time": "4:28:23", "throughput": 901.18, "total_tokens": 2332432} {"current_steps": 1790, "total_steps": 12855, "loss": 0.9868, "accuracy": 0.8999999761581421, "learning_rate": 4.7645846030481656e-05, "epoch": 0.13924542979385454, "percentage": 13.92, "elapsed_time": "0:43:29", "remaining_time": "4:28:51", "throughput": 898.72, "total_tokens": 2345360} {"current_steps": 1800, "total_steps": 12855, "loss": 1.2197, "accuracy": 0.8999999761581421, "learning_rate": 4.761989583948173e-05, "epoch": 0.14002333722287047, "percentage": 14.0, "elapsed_time": "0:43:44", "remaining_time": "4:28:36", "throughput": 898.08, "total_tokens": 2356688} {"current_steps": 1810, "total_steps": 12855, "loss": 1.2146, "accuracy": 0.699999988079071, "learning_rate": 4.7593810551399996e-05, "epoch": 0.14080124465188643, "percentage": 14.08, "elapsed_time": "0:43:59", "remaining_time": "4:28:26", "throughput": 897.2, "total_tokens": 2368128} {"current_steps": 1820, "total_steps": 12855, "loss": 0.8944, "accuracy": 0.8999999761581421, "learning_rate": 4.756759032203058e-05, "epoch": 0.14157915208090238, "percentage": 14.16, "elapsed_time": "0:44:15", "remaining_time": "4:28:19", "throughput": 896.09, "total_tokens": 2379456} {"current_steps": 1830, "total_steps": 12855, "loss": 1.0135, "accuracy": 0.699999988079071, "learning_rate": 4.754123530797349e-05, "epoch": 0.1423570595099183, "percentage": 14.24, "elapsed_time": "0:44:28", "remaining_time": "4:27:57", "throughput": 895.8, "total_tokens": 2390576} {"current_steps": 1840, "total_steps": 12855, "loss": 1.0258, "accuracy": 0.8999999761581421, "learning_rate": 4.7514745666633765e-05, "epoch": 0.14313496693893427, "percentage": 14.31, "elapsed_time": "0:44:43", "remaining_time": "4:27:46", "throughput": 895.64, "total_tokens": 2403664} {"current_steps": 1850, "total_steps": 12855, "loss": 1.2283, "accuracy": 0.800000011920929, "learning_rate": 4.748812155622051e-05, "epoch": 0.14391287436795022, "percentage": 14.39, "elapsed_time": "0:44:54", "remaining_time": "4:27:10", "throughput": 895.44, "total_tokens": 2412992} {"current_steps": 1860, "total_steps": 12855, "loss": 1.0447, "accuracy": 0.6000000238418579, "learning_rate": 4.746136313574593e-05, "epoch": 0.14469078179696615, "percentage": 14.47, "elapsed_time": "0:45:10", "remaining_time": "4:27:05", "throughput": 894.74, "total_tokens": 2425600} {"current_steps": 1870, "total_steps": 12855, "loss": 1.0503, "accuracy": 0.699999988079071, "learning_rate": 4.74344705650244e-05, "epoch": 0.1454686892259821, "percentage": 14.55, "elapsed_time": "0:45:21", "remaining_time": "4:26:29", "throughput": 894.57, "total_tokens": 2434992} {"current_steps": 1880, "total_steps": 12855, "loss": 1.0229, "accuracy": 0.8999999761581421, "learning_rate": 4.74074440046715e-05, "epoch": 0.14624659665499806, "percentage": 14.62, "elapsed_time": "0:45:44", "remaining_time": "4:27:01", "throughput": 892.59, "total_tokens": 2449712} {"current_steps": 1890, "total_steps": 12855, "loss": 1.0202, "accuracy": 0.8999999761581421, "learning_rate": 4.738028361610308e-05, "epoch": 0.147024504084014, "percentage": 14.7, "elapsed_time": "0:46:09", "remaining_time": "4:27:48", "throughput": 890.46, "total_tokens": 2466224} {"current_steps": 1900, "total_steps": 12855, "loss": 0.8636, "accuracy": 0.8999999761581421, "learning_rate": 4.7352989561534254e-05, "epoch": 0.14780241151302995, "percentage": 14.78, "elapsed_time": "0:46:31", "remaining_time": "4:28:15", "throughput": 889.11, "total_tokens": 2481952} {"current_steps": 1910, "total_steps": 12855, "loss": 0.8538, "accuracy": 0.5, "learning_rate": 4.732556200397848e-05, "epoch": 0.1485803189420459, "percentage": 14.86, "elapsed_time": "0:46:49", "remaining_time": "4:28:21", "throughput": 888.18, "total_tokens": 2495664} {"current_steps": 1920, "total_steps": 12855, "loss": 1.0023, "accuracy": 0.699999988079071, "learning_rate": 4.729800110724654e-05, "epoch": 0.14935822637106183, "percentage": 14.94, "elapsed_time": "0:47:14", "remaining_time": "4:29:05", "throughput": 886.43, "total_tokens": 2512992} {"current_steps": 1930, "total_steps": 12855, "loss": 1.0211, "accuracy": 0.699999988079071, "learning_rate": 4.727030703594557e-05, "epoch": 0.1501361338000778, "percentage": 15.01, "elapsed_time": "0:47:37", "remaining_time": "4:29:35", "throughput": 885.11, "total_tokens": 2529264} {"current_steps": 1940, "total_steps": 12855, "loss": 0.8893, "accuracy": 0.699999988079071, "learning_rate": 4.7242479955478145e-05, "epoch": 0.15091404122909374, "percentage": 15.09, "elapsed_time": "0:47:48", "remaining_time": "4:28:57", "throughput": 884.8, "total_tokens": 2537824} {"current_steps": 1950, "total_steps": 12855, "loss": 0.8987, "accuracy": 1.0, "learning_rate": 4.721452003204118e-05, "epoch": 0.1516919486581097, "percentage": 15.17, "elapsed_time": "0:48:05", "remaining_time": "4:28:57", "throughput": 884.11, "total_tokens": 2551184} {"current_steps": 1960, "total_steps": 12855, "loss": 0.7254, "accuracy": 1.0, "learning_rate": 4.7186427432625005e-05, "epoch": 0.15246985608712563, "percentage": 15.25, "elapsed_time": "0:48:31", "remaining_time": "4:29:42", "throughput": 882.29, "total_tokens": 2568528} {"current_steps": 1970, "total_steps": 12855, "loss": 1.064, "accuracy": 0.699999988079071, "learning_rate": 4.715820232501239e-05, "epoch": 0.15324776351614158, "percentage": 15.32, "elapsed_time": "0:48:51", "remaining_time": "4:29:56", "throughput": 881.14, "total_tokens": 2582928} {"current_steps": 1980, "total_steps": 12855, "loss": 1.0163, "accuracy": 0.699999988079071, "learning_rate": 4.7129844877777456e-05, "epoch": 0.15402567094515754, "percentage": 15.4, "elapsed_time": "0:49:05", "remaining_time": "4:29:39", "throughput": 881.13, "total_tokens": 2595600} {"current_steps": 1990, "total_steps": 12855, "loss": 1.0394, "accuracy": 0.800000011920929, "learning_rate": 4.710135526028477e-05, "epoch": 0.15480357837417347, "percentage": 15.48, "elapsed_time": "0:49:46", "remaining_time": "4:31:42", "throughput": 876.27, "total_tokens": 2616560} {"current_steps": 2000, "total_steps": 12855, "loss": 1.2625, "accuracy": 0.8999999761581421, "learning_rate": 4.707273364268825e-05, "epoch": 0.15558148580318942, "percentage": 15.56, "elapsed_time": "0:50:02", "remaining_time": "4:31:35", "throughput": 875.84, "total_tokens": 2629616} {"current_steps": 2010, "total_steps": 12855, "loss": 1.0967, "accuracy": 0.699999988079071, "learning_rate": 4.70439801959302e-05, "epoch": 0.15635939323220538, "percentage": 15.64, "elapsed_time": "0:50:29", "remaining_time": "4:32:27", "throughput": 872.41, "total_tokens": 2643328} {"current_steps": 2020, "total_steps": 12855, "loss": 0.9446, "accuracy": 0.8999999761581421, "learning_rate": 4.701509509174027e-05, "epoch": 0.1571373006612213, "percentage": 15.71, "elapsed_time": "0:51:02", "remaining_time": "4:33:49", "throughput": 866.2, "total_tokens": 2653136} {"current_steps": 2030, "total_steps": 12855, "loss": 1.036, "accuracy": 0.800000011920929, "learning_rate": 4.698607850263442e-05, "epoch": 0.15791520809023726, "percentage": 15.79, "elapsed_time": "0:51:25", "remaining_time": "4:34:13", "throughput": 862.79, "total_tokens": 2662192} {"current_steps": 2040, "total_steps": 12855, "loss": 1.069, "accuracy": 0.699999988079071, "learning_rate": 4.6956930601913924e-05, "epoch": 0.15869311551925322, "percentage": 15.87, "elapsed_time": "0:52:00", "remaining_time": "4:35:40", "throughput": 858.15, "total_tokens": 2677456} {"current_steps": 2050, "total_steps": 12855, "loss": 0.7734, "accuracy": 0.699999988079071, "learning_rate": 4.6927651563664296e-05, "epoch": 0.15947102294826915, "percentage": 15.95, "elapsed_time": "0:52:28", "remaining_time": "4:36:35", "throughput": 855.28, "total_tokens": 2692944} {"current_steps": 2060, "total_steps": 12855, "loss": 0.8686, "accuracy": 0.6000000238418579, "learning_rate": 4.689824156275428e-05, "epoch": 0.1602489303772851, "percentage": 16.02, "elapsed_time": "0:52:47", "remaining_time": "4:36:39", "throughput": 853.61, "total_tokens": 2703904} {"current_steps": 2070, "total_steps": 12855, "loss": 1.1021, "accuracy": 0.8999999761581421, "learning_rate": 4.686870077483478e-05, "epoch": 0.16102683780630106, "percentage": 16.1, "elapsed_time": "0:53:01", "remaining_time": "4:36:14", "throughput": 853.16, "total_tokens": 2714112} {"current_steps": 2080, "total_steps": 12855, "loss": 0.9435, "accuracy": 0.800000011920929, "learning_rate": 4.6839029376337825e-05, "epoch": 0.161804745235317, "percentage": 16.18, "elapsed_time": "0:53:21", "remaining_time": "4:36:22", "throughput": 852.4, "total_tokens": 2728544} {"current_steps": 2090, "total_steps": 12855, "loss": 1.0744, "accuracy": 0.8999999761581421, "learning_rate": 4.680922754447554e-05, "epoch": 0.16258265266433294, "percentage": 16.26, "elapsed_time": "0:53:45", "remaining_time": "4:36:53", "throughput": 850.31, "total_tokens": 2742592} {"current_steps": 2100, "total_steps": 12855, "loss": 0.8857, "accuracy": 0.800000011920929, "learning_rate": 4.6779295457239025e-05, "epoch": 0.1633605600933489, "percentage": 16.34, "elapsed_time": "0:53:58", "remaining_time": "4:36:25", "throughput": 850.45, "total_tokens": 2754208} {"current_steps": 2110, "total_steps": 12855, "loss": 0.8577, "accuracy": 0.800000011920929, "learning_rate": 4.6749233293397346e-05, "epoch": 0.16413846752236483, "percentage": 16.41, "elapsed_time": "0:54:13", "remaining_time": "4:36:09", "throughput": 849.38, "total_tokens": 2763648} {"current_steps": 2120, "total_steps": 12855, "loss": 0.7813, "accuracy": 1.0, "learning_rate": 4.671904123249645e-05, "epoch": 0.16491637495138078, "percentage": 16.49, "elapsed_time": "0:54:39", "remaining_time": "4:36:44", "throughput": 847.2, "total_tokens": 2778096} {"current_steps": 2130, "total_steps": 12855, "loss": 0.9546, "accuracy": 0.8999999761581421, "learning_rate": 4.66887194548581e-05, "epoch": 0.16569428238039674, "percentage": 16.57, "elapsed_time": "0:54:55", "remaining_time": "4:36:31", "throughput": 846.63, "total_tokens": 2789712} {"current_steps": 2140, "total_steps": 12855, "loss": 1.0925, "accuracy": 0.6000000238418579, "learning_rate": 4.665826814157878e-05, "epoch": 0.16647218980941267, "percentage": 16.65, "elapsed_time": "0:55:16", "remaining_time": "4:36:46", "throughput": 845.9, "total_tokens": 2805600} {"current_steps": 2150, "total_steps": 12855, "loss": 0.86, "accuracy": 0.8999999761581421, "learning_rate": 4.662768747452862e-05, "epoch": 0.16725009723842862, "percentage": 16.73, "elapsed_time": "0:55:29", "remaining_time": "4:36:17", "throughput": 846.05, "total_tokens": 2816848} {"current_steps": 2160, "total_steps": 12855, "loss": 1.2139, "accuracy": 0.699999988079071, "learning_rate": 4.6596977636350325e-05, "epoch": 0.16802800466744458, "percentage": 16.8, "elapsed_time": "0:55:41", "remaining_time": "4:35:46", "throughput": 846.1, "total_tokens": 2827472} {"current_steps": 2170, "total_steps": 12855, "loss": 0.8659, "accuracy": 0.800000011920929, "learning_rate": 4.656613881045808e-05, "epoch": 0.1688059120964605, "percentage": 16.88, "elapsed_time": "0:55:56", "remaining_time": "4:35:25", "throughput": 846.18, "total_tokens": 2839984} {"current_steps": 2180, "total_steps": 12855, "loss": 0.8124, "accuracy": 0.800000011920929, "learning_rate": 4.653517118103642e-05, "epoch": 0.16958381952547646, "percentage": 16.96, "elapsed_time": "0:56:10", "remaining_time": "4:35:04", "throughput": 845.9, "total_tokens": 2851120} {"current_steps": 2190, "total_steps": 12855, "loss": 0.7893, "accuracy": 0.800000011920929, "learning_rate": 4.6504074933039185e-05, "epoch": 0.17036172695449242, "percentage": 17.04, "elapsed_time": "0:56:21", "remaining_time": "4:34:25", "throughput": 845.9, "total_tokens": 2859984} {"current_steps": 2200, "total_steps": 12855, "loss": 1.2555, "accuracy": 0.699999988079071, "learning_rate": 4.647285025218837e-05, "epoch": 0.17113963438350835, "percentage": 17.11, "elapsed_time": "0:56:45", "remaining_time": "4:34:51", "throughput": 844.83, "total_tokens": 2876672} {"current_steps": 2210, "total_steps": 12855, "loss": 1.0537, "accuracy": 0.6000000238418579, "learning_rate": 4.644149732497305e-05, "epoch": 0.1719175418125243, "percentage": 17.19, "elapsed_time": "0:56:56", "remaining_time": "4:34:16", "throughput": 845.16, "total_tokens": 2887568} {"current_steps": 2220, "total_steps": 12855, "loss": 1.0015, "accuracy": 0.800000011920929, "learning_rate": 4.6410016338648246e-05, "epoch": 0.17269544924154026, "percentage": 17.27, "elapsed_time": "0:57:13", "remaining_time": "4:34:08", "throughput": 845.14, "total_tokens": 2901824} {"current_steps": 2230, "total_steps": 12855, "loss": 1.2448, "accuracy": 0.6000000238418579, "learning_rate": 4.637840748123379e-05, "epoch": 0.17347335667055622, "percentage": 17.35, "elapsed_time": "0:57:32", "remaining_time": "4:34:07", "throughput": 844.18, "total_tokens": 2914160} {"current_steps": 2240, "total_steps": 12855, "loss": 0.9599, "accuracy": 0.8999999761581421, "learning_rate": 4.634667094151325e-05, "epoch": 0.17425126409957215, "percentage": 17.43, "elapsed_time": "0:57:43", "remaining_time": "4:33:32", "throughput": 844.57, "total_tokens": 2925072} {"current_steps": 2250, "total_steps": 12855, "loss": 0.8628, "accuracy": 0.8999999761581421, "learning_rate": 4.6314806909032766e-05, "epoch": 0.1750291715285881, "percentage": 17.5, "elapsed_time": "0:58:04", "remaining_time": "4:33:41", "throughput": 843.93, "total_tokens": 2940336} {"current_steps": 2260, "total_steps": 12855, "loss": 0.9506, "accuracy": 0.8999999761581421, "learning_rate": 4.6282815574099915e-05, "epoch": 0.17580707895760406, "percentage": 17.58, "elapsed_time": "0:58:23", "remaining_time": "4:33:43", "throughput": 843.53, "total_tokens": 2955120} {"current_steps": 2270, "total_steps": 12855, "loss": 1.0807, "accuracy": 0.5, "learning_rate": 4.625069712778262e-05, "epoch": 0.17658498638661999, "percentage": 17.66, "elapsed_time": "0:58:46", "remaining_time": "4:34:06", "throughput": 842.41, "total_tokens": 2971120} {"current_steps": 2280, "total_steps": 12855, "loss": 0.948, "accuracy": 0.800000011920929, "learning_rate": 4.6218451761907916e-05, "epoch": 0.17736289381563594, "percentage": 17.74, "elapsed_time": "0:59:00", "remaining_time": "4:33:41", "throughput": 842.71, "total_tokens": 2983664} {"current_steps": 2290, "total_steps": 12855, "loss": 1.072, "accuracy": 0.800000011920929, "learning_rate": 4.618607966906093e-05, "epoch": 0.1781408012446519, "percentage": 17.81, "elapsed_time": "0:59:13", "remaining_time": "4:33:12", "throughput": 842.78, "total_tokens": 2994544} {"current_steps": 2300, "total_steps": 12855, "loss": 1.0113, "accuracy": 0.699999988079071, "learning_rate": 4.615358104258362e-05, "epoch": 0.17891870867366783, "percentage": 17.89, "elapsed_time": "0:59:29", "remaining_time": "4:32:59", "throughput": 842.58, "total_tokens": 3007296} {"current_steps": 2310, "total_steps": 12855, "loss": 0.8714, "accuracy": 1.0, "learning_rate": 4.612095607657368e-05, "epoch": 0.17969661610268378, "percentage": 17.97, "elapsed_time": "0:59:44", "remaining_time": "4:32:43", "throughput": 842.39, "total_tokens": 3019632} {"current_steps": 2320, "total_steps": 12855, "loss": 0.9708, "accuracy": 0.800000011920929, "learning_rate": 4.6088204965883374e-05, "epoch": 0.18047452353169974, "percentage": 18.05, "elapsed_time": "1:00:07", "remaining_time": "4:33:02", "throughput": 841.43, "total_tokens": 3035568} {"current_steps": 2330, "total_steps": 12855, "loss": 1.128, "accuracy": 0.699999988079071, "learning_rate": 4.605532790611834e-05, "epoch": 0.18125243096071567, "percentage": 18.13, "elapsed_time": "1:00:33", "remaining_time": "4:33:34", "throughput": 839.62, "total_tokens": 3050976} {"current_steps": 2340, "total_steps": 12855, "loss": 1.0032, "accuracy": 0.699999988079071, "learning_rate": 4.602232509363647e-05, "epoch": 0.18203033838973162, "percentage": 18.2, "elapsed_time": "1:00:59", "remaining_time": "4:34:03", "throughput": 838.56, "total_tokens": 3068576} {"current_steps": 2350, "total_steps": 12855, "loss": 0.9253, "accuracy": 0.8999999761581421, "learning_rate": 4.5989196725546704e-05, "epoch": 0.18280824581874758, "percentage": 18.28, "elapsed_time": "1:01:17", "remaining_time": "4:33:58", "throughput": 837.73, "total_tokens": 3080592} {"current_steps": 2360, "total_steps": 12855, "loss": 0.842, "accuracy": 0.699999988079071, "learning_rate": 4.595594299970786e-05, "epoch": 0.1835861532477635, "percentage": 18.36, "elapsed_time": "1:01:44", "remaining_time": "4:34:35", "throughput": 835.66, "total_tokens": 3096016} {"current_steps": 2370, "total_steps": 12855, "loss": 0.7966, "accuracy": 0.8999999761581421, "learning_rate": 4.592256411472744e-05, "epoch": 0.18436406067677946, "percentage": 18.44, "elapsed_time": "1:01:58", "remaining_time": "4:34:09", "throughput": 835.76, "total_tokens": 3107456} {"current_steps": 2380, "total_steps": 12855, "loss": 1.0393, "accuracy": 0.800000011920929, "learning_rate": 4.5889060269960484e-05, "epoch": 0.18514196810579542, "percentage": 18.51, "elapsed_time": "1:02:11", "remaining_time": "4:33:44", "throughput": 835.61, "total_tokens": 3118288} {"current_steps": 2390, "total_steps": 12855, "loss": 1.1342, "accuracy": 0.800000011920929, "learning_rate": 4.5855431665508345e-05, "epoch": 0.18591987553481135, "percentage": 18.59, "elapsed_time": "1:02:29", "remaining_time": "4:33:38", "throughput": 835.83, "total_tokens": 3134016} {"current_steps": 2400, "total_steps": 12855, "loss": 1.0009, "accuracy": 0.5, "learning_rate": 4.582167850221748e-05, "epoch": 0.1866977829638273, "percentage": 18.67, "elapsed_time": "1:02:44", "remaining_time": "4:33:17", "throughput": 835.93, "total_tokens": 3146544} {"current_steps": 2410, "total_steps": 12855, "loss": 0.7382, "accuracy": 0.800000011920929, "learning_rate": 4.5787800981678296e-05, "epoch": 0.18747569039284326, "percentage": 18.75, "elapsed_time": "1:03:12", "remaining_time": "4:33:54", "throughput": 834.43, "total_tokens": 3164224} {"current_steps": 2420, "total_steps": 12855, "loss": 1.1651, "accuracy": 0.6000000238418579, "learning_rate": 4.5753799306223925e-05, "epoch": 0.1882535978218592, "percentage": 18.83, "elapsed_time": "1:03:33", "remaining_time": "4:34:02", "throughput": 833.85, "total_tokens": 3179568} {"current_steps": 2430, "total_steps": 12855, "loss": 0.7549, "accuracy": 0.8999999761581421, "learning_rate": 4.5719673678929e-05, "epoch": 0.18903150525087514, "percentage": 18.9, "elapsed_time": "1:03:56", "remaining_time": "4:34:17", "throughput": 832.29, "total_tokens": 3192832} {"current_steps": 2440, "total_steps": 12855, "loss": 1.1856, "accuracy": 0.800000011920929, "learning_rate": 4.568542430360846e-05, "epoch": 0.1898094126798911, "percentage": 18.98, "elapsed_time": "1:04:08", "remaining_time": "4:33:48", "throughput": 832.5, "total_tokens": 3204080} {"current_steps": 2450, "total_steps": 12855, "loss": 1.2029, "accuracy": 0.8999999761581421, "learning_rate": 4.565105138481631e-05, "epoch": 0.19058732010890703, "percentage": 19.06, "elapsed_time": "1:04:30", "remaining_time": "4:33:57", "throughput": 831.55, "total_tokens": 3218432} {"current_steps": 2460, "total_steps": 12855, "loss": 0.7949, "accuracy": 0.800000011920929, "learning_rate": 4.5616555127844455e-05, "epoch": 0.19136522753792298, "percentage": 19.14, "elapsed_time": "1:04:47", "remaining_time": "4:33:48", "throughput": 831.18, "total_tokens": 3231408} {"current_steps": 2470, "total_steps": 12855, "loss": 1.091, "accuracy": 0.699999988079071, "learning_rate": 4.55819357387214e-05, "epoch": 0.19214313496693894, "percentage": 19.21, "elapsed_time": "1:05:01", "remaining_time": "4:33:22", "throughput": 831.5, "total_tokens": 3243872} {"current_steps": 2480, "total_steps": 12855, "loss": 0.9194, "accuracy": 0.6000000238418579, "learning_rate": 4.554719342421108e-05, "epoch": 0.1929210423959549, "percentage": 19.29, "elapsed_time": "1:05:14", "remaining_time": "4:32:56", "throughput": 831.58, "total_tokens": 3255296} {"current_steps": 2490, "total_steps": 12855, "loss": 1.0779, "accuracy": 0.8999999761581421, "learning_rate": 4.551232839181159e-05, "epoch": 0.19369894982497082, "percentage": 19.37, "elapsed_time": "1:05:42", "remaining_time": "4:33:32", "throughput": 830.23, "total_tokens": 3273408} {"current_steps": 2500, "total_steps": 12855, "loss": 0.9503, "accuracy": 0.8999999761581421, "learning_rate": 4.5477340849753944e-05, "epoch": 0.19447685725398678, "percentage": 19.45, "elapsed_time": "1:05:59", "remaining_time": "4:33:22", "throughput": 829.5, "total_tokens": 3284784} {"current_steps": 2510, "total_steps": 12855, "loss": 0.9709, "accuracy": 0.800000011920929, "learning_rate": 4.544223100700087e-05, "epoch": 0.19525476468300274, "percentage": 19.53, "elapsed_time": "1:06:20", "remaining_time": "4:33:27", "throughput": 828.68, "total_tokens": 3298928} {"current_steps": 2520, "total_steps": 12855, "loss": 1.0037, "accuracy": 0.800000011920929, "learning_rate": 4.540699907324552e-05, "epoch": 0.19603267211201866, "percentage": 19.6, "elapsed_time": "1:06:37", "remaining_time": "4:33:15", "throughput": 827.68, "total_tokens": 3308880} {"current_steps": 2530, "total_steps": 12855, "loss": 0.8472, "accuracy": 0.699999988079071, "learning_rate": 4.537164525891023e-05, "epoch": 0.19681057954103462, "percentage": 19.68, "elapsed_time": "1:07:03", "remaining_time": "4:33:41", "throughput": 826.29, "total_tokens": 3324896} {"current_steps": 2540, "total_steps": 12855, "loss": 0.9156, "accuracy": 0.8999999761581421, "learning_rate": 4.533616977514527e-05, "epoch": 0.19758848697005058, "percentage": 19.76, "elapsed_time": "1:07:28", "remaining_time": "4:33:59", "throughput": 825.35, "total_tokens": 3341072} {"current_steps": 2550, "total_steps": 12855, "loss": 0.6655, "accuracy": 1.0, "learning_rate": 4.530057283382759e-05, "epoch": 0.1983663943990665, "percentage": 19.84, "elapsed_time": "1:07:53", "remaining_time": "4:34:20", "throughput": 823.45, "total_tokens": 3354048} {"current_steps": 2560, "total_steps": 12855, "loss": 0.9926, "accuracy": 0.6000000238418579, "learning_rate": 4.5264854647559516e-05, "epoch": 0.19914430182808246, "percentage": 19.91, "elapsed_time": "1:08:10", "remaining_time": "4:34:10", "throughput": 823.23, "total_tokens": 3367584} {"current_steps": 2570, "total_steps": 12855, "loss": 0.8642, "accuracy": 0.699999988079071, "learning_rate": 4.522901542966756e-05, "epoch": 0.19992220925709842, "percentage": 19.99, "elapsed_time": "1:08:18", "remaining_time": "4:33:21", "throughput": 823.51, "total_tokens": 3375024} {"current_steps": 2580, "total_steps": 12855, "loss": 1.1658, "accuracy": 0.6000000238418579, "learning_rate": 4.5193055394201025e-05, "epoch": 0.20070011668611434, "percentage": 20.07, "elapsed_time": "1:08:33", "remaining_time": "4:33:03", "throughput": 823.41, "total_tokens": 3387376} {"current_steps": 2590, "total_steps": 12855, "loss": 0.909, "accuracy": 0.5, "learning_rate": 4.515697475593085e-05, "epoch": 0.2014780241151303, "percentage": 20.15, "elapsed_time": "1:08:58", "remaining_time": "4:33:21", "throughput": 822.54, "total_tokens": 3403952} {"current_steps": 2600, "total_steps": 12855, "loss": 0.8639, "accuracy": 0.800000011920929, "learning_rate": 4.512077373034825e-05, "epoch": 0.20225593154414626, "percentage": 20.23, "elapsed_time": "1:09:12", "remaining_time": "4:32:58", "throughput": 822.44, "total_tokens": 3415264} {"current_steps": 2610, "total_steps": 12855, "loss": 1.1177, "accuracy": 0.5, "learning_rate": 4.5084452533663466e-05, "epoch": 0.20303383897316218, "percentage": 20.3, "elapsed_time": "1:09:26", "remaining_time": "4:32:34", "throughput": 822.6, "total_tokens": 3427392} {"current_steps": 2620, "total_steps": 12855, "loss": 1.0858, "accuracy": 0.5, "learning_rate": 4.504801138280445e-05, "epoch": 0.20381174640217814, "percentage": 20.38, "elapsed_time": "1:09:43", "remaining_time": "4:32:24", "throughput": 822.43, "total_tokens": 3440992} {"current_steps": 2630, "total_steps": 12855, "loss": 1.008, "accuracy": 0.699999988079071, "learning_rate": 4.5011450495415555e-05, "epoch": 0.2045896538311941, "percentage": 20.46, "elapsed_time": "1:10:06", "remaining_time": "4:32:33", "throughput": 821.6, "total_tokens": 3455888} {"current_steps": 2640, "total_steps": 12855, "loss": 0.8501, "accuracy": 0.800000011920929, "learning_rate": 4.49747700898563e-05, "epoch": 0.20536756126021002, "percentage": 20.54, "elapsed_time": "1:10:31", "remaining_time": "4:32:53", "throughput": 820.69, "total_tokens": 3472864} {"current_steps": 2650, "total_steps": 12855, "loss": 0.9523, "accuracy": 0.8999999761581421, "learning_rate": 4.493797038520001e-05, "epoch": 0.20614546868922598, "percentage": 20.61, "elapsed_time": "1:10:51", "remaining_time": "4:32:53", "throughput": 820.18, "total_tokens": 3487200} {"current_steps": 2660, "total_steps": 12855, "loss": 1.1143, "accuracy": 0.800000011920929, "learning_rate": 4.4901051601232526e-05, "epoch": 0.20692337611824194, "percentage": 20.69, "elapsed_time": "1:11:10", "remaining_time": "4:32:48", "throughput": 820.08, "total_tokens": 3502288} {"current_steps": 2670, "total_steps": 12855, "loss": 1.1485, "accuracy": 0.800000011920929, "learning_rate": 4.4864013958450867e-05, "epoch": 0.20770128354725786, "percentage": 20.77, "elapsed_time": "1:11:35", "remaining_time": "4:33:06", "throughput": 818.97, "total_tokens": 3518000} {"current_steps": 2680, "total_steps": 12855, "loss": 1.1486, "accuracy": 0.6000000238418579, "learning_rate": 4.482685767806196e-05, "epoch": 0.20847919097627382, "percentage": 20.85, "elapsed_time": "1:11:51", "remaining_time": "4:32:48", "throughput": 818.43, "total_tokens": 3528432} {"current_steps": 2690, "total_steps": 12855, "loss": 1.0319, "accuracy": 0.800000011920929, "learning_rate": 4.4789582981981294e-05, "epoch": 0.20925709840528978, "percentage": 20.93, "elapsed_time": "1:12:05", "remaining_time": "4:32:26", "throughput": 818.25, "total_tokens": 3539520} {"current_steps": 2700, "total_steps": 12855, "loss": 0.8774, "accuracy": 0.8999999761581421, "learning_rate": 4.475219009283157e-05, "epoch": 0.2100350058343057, "percentage": 21.0, "elapsed_time": "1:12:26", "remaining_time": "4:32:26", "throughput": 817.7, "total_tokens": 3553856} {"current_steps": 2710, "total_steps": 12855, "loss": 0.8601, "accuracy": 0.8999999761581421, "learning_rate": 4.471467923394142e-05, "epoch": 0.21081291326332166, "percentage": 21.08, "elapsed_time": "1:12:52", "remaining_time": "4:32:49", "throughput": 815.66, "total_tokens": 3566720} {"current_steps": 2720, "total_steps": 12855, "loss": 0.7865, "accuracy": 0.8999999761581421, "learning_rate": 4.467705062934405e-05, "epoch": 0.21159082069233762, "percentage": 21.16, "elapsed_time": "1:13:06", "remaining_time": "4:32:26", "throughput": 815.84, "total_tokens": 3579088} {"current_steps": 2730, "total_steps": 12855, "loss": 0.8716, "accuracy": 0.699999988079071, "learning_rate": 4.463930450377587e-05, "epoch": 0.21236872812135357, "percentage": 21.24, "elapsed_time": "1:13:23", "remaining_time": "4:32:12", "throughput": 815.48, "total_tokens": 3591184} {"current_steps": 2740, "total_steps": 12855, "loss": 0.9273, "accuracy": 0.8999999761581421, "learning_rate": 4.460144108267522e-05, "epoch": 0.2131466355503695, "percentage": 21.31, "elapsed_time": "1:13:34", "remaining_time": "4:31:37", "throughput": 815.58, "total_tokens": 3600656} {"current_steps": 2750, "total_steps": 12855, "loss": 0.9811, "accuracy": 0.800000011920929, "learning_rate": 4.4563460592180966e-05, "epoch": 0.21392454297938546, "percentage": 21.39, "elapsed_time": "1:13:52", "remaining_time": "4:31:26", "throughput": 814.89, "total_tokens": 3611760} {"current_steps": 2760, "total_steps": 12855, "loss": 1.0853, "accuracy": 1.0, "learning_rate": 4.4525363259131175e-05, "epoch": 0.2147024504084014, "percentage": 21.47, "elapsed_time": "1:14:10", "remaining_time": "4:31:17", "throughput": 814.42, "total_tokens": 3624352} {"current_steps": 2770, "total_steps": 12855, "loss": 0.8297, "accuracy": 0.8999999761581421, "learning_rate": 4.4487149311061754e-05, "epoch": 0.21548035783741734, "percentage": 21.55, "elapsed_time": "1:14:25", "remaining_time": "4:30:57", "throughput": 814.41, "total_tokens": 3636736} {"current_steps": 2780, "total_steps": 12855, "loss": 0.9828, "accuracy": 0.800000011920929, "learning_rate": 4.444881897620509e-05, "epoch": 0.2162582652664333, "percentage": 21.63, "elapsed_time": "1:14:40", "remaining_time": "4:30:38", "throughput": 814.57, "total_tokens": 3649920} {"current_steps": 2790, "total_steps": 12855, "loss": 0.9442, "accuracy": 0.8999999761581421, "learning_rate": 4.441037248348869e-05, "epoch": 0.21703617269544925, "percentage": 21.7, "elapsed_time": "1:14:58", "remaining_time": "4:30:29", "throughput": 814.22, "total_tokens": 3662992} {"current_steps": 2800, "total_steps": 12855, "loss": 0.9668, "accuracy": 1.0, "learning_rate": 4.437181006253382e-05, "epoch": 0.21781408012446518, "percentage": 21.78, "elapsed_time": "1:15:12", "remaining_time": "4:30:04", "throughput": 814.26, "total_tokens": 3674288} {"current_steps": 2810, "total_steps": 12855, "loss": 1.0816, "accuracy": 0.6000000238418579, "learning_rate": 4.433313194365411e-05, "epoch": 0.21859198755348114, "percentage": 21.86, "elapsed_time": "1:15:25", "remaining_time": "4:29:38", "throughput": 813.89, "total_tokens": 3683472} {"current_steps": 2820, "total_steps": 12855, "loss": 1.1106, "accuracy": 0.5, "learning_rate": 4.429433835785422e-05, "epoch": 0.2193698949824971, "percentage": 21.94, "elapsed_time": "1:15:42", "remaining_time": "4:29:24", "throughput": 813.63, "total_tokens": 3695840} {"current_steps": 2830, "total_steps": 12855, "loss": 0.9, "accuracy": 0.8999999761581421, "learning_rate": 4.425542953682841e-05, "epoch": 0.22014780241151302, "percentage": 22.01, "elapsed_time": "1:16:03", "remaining_time": "4:29:26", "throughput": 812.88, "total_tokens": 3709792} {"current_steps": 2840, "total_steps": 12855, "loss": 1.1238, "accuracy": 0.699999988079071, "learning_rate": 4.421640571295918e-05, "epoch": 0.22092570984052898, "percentage": 22.09, "elapsed_time": "1:16:18", "remaining_time": "4:29:04", "throughput": 812.91, "total_tokens": 3721664} {"current_steps": 2850, "total_steps": 12855, "loss": 0.9641, "accuracy": 0.6000000238418579, "learning_rate": 4.4177267119315905e-05, "epoch": 0.22170361726954493, "percentage": 22.17, "elapsed_time": "1:16:28", "remaining_time": "4:28:28", "throughput": 812.86, "total_tokens": 3729968} {"current_steps": 2860, "total_steps": 12855, "loss": 0.886, "accuracy": 0.699999988079071, "learning_rate": 4.4138013989653406e-05, "epoch": 0.22248152469856086, "percentage": 22.25, "elapsed_time": "1:16:47", "remaining_time": "4:28:21", "throughput": 812.72, "total_tokens": 3744544} {"current_steps": 2870, "total_steps": 12855, "loss": 1.1547, "accuracy": 0.8999999761581421, "learning_rate": 4.409864655841058e-05, "epoch": 0.22325943212757682, "percentage": 22.33, "elapsed_time": "1:17:11", "remaining_time": "4:28:32", "throughput": 811.91, "total_tokens": 3760112} {"current_steps": 2880, "total_steps": 12855, "loss": 0.7769, "accuracy": 0.699999988079071, "learning_rate": 4.405916506070897e-05, "epoch": 0.22403733955659277, "percentage": 22.4, "elapsed_time": "1:17:36", "remaining_time": "4:28:47", "throughput": 810.51, "total_tokens": 3774064} {"current_steps": 2890, "total_steps": 12855, "loss": 0.9157, "accuracy": 0.699999988079071, "learning_rate": 4.40195697323514e-05, "epoch": 0.2248152469856087, "percentage": 22.48, "elapsed_time": "1:17:54", "remaining_time": "4:28:37", "throughput": 810.21, "total_tokens": 3787120} {"current_steps": 2900, "total_steps": 12855, "loss": 0.8606, "accuracy": 0.699999988079071, "learning_rate": 4.397986080982053e-05, "epoch": 0.22559315441462466, "percentage": 22.56, "elapsed_time": "1:18:07", "remaining_time": "4:28:12", "throughput": 810.18, "total_tokens": 3797968} {"current_steps": 2910, "total_steps": 12855, "loss": 0.7953, "accuracy": 0.800000011920929, "learning_rate": 4.394003853027748e-05, "epoch": 0.22637106184364061, "percentage": 22.64, "elapsed_time": "1:18:29", "remaining_time": "4:28:13", "throughput": 809.52, "total_tokens": 3812112} {"current_steps": 2920, "total_steps": 12855, "loss": 0.8429, "accuracy": 0.8999999761581421, "learning_rate": 4.3900103131560376e-05, "epoch": 0.22714896927265654, "percentage": 22.71, "elapsed_time": "1:18:44", "remaining_time": "4:27:53", "throughput": 809.63, "total_tokens": 3824768} {"current_steps": 2930, "total_steps": 12855, "loss": 0.9075, "accuracy": 0.800000011920929, "learning_rate": 4.386005485218294e-05, "epoch": 0.2279268767016725, "percentage": 22.79, "elapsed_time": "1:18:59", "remaining_time": "4:27:32", "throughput": 809.65, "total_tokens": 3836960} {"current_steps": 2940, "total_steps": 12855, "loss": 0.8842, "accuracy": 0.800000011920929, "learning_rate": 4.3819893931333106e-05, "epoch": 0.22870478413068845, "percentage": 22.87, "elapsed_time": "1:19:17", "remaining_time": "4:27:24", "throughput": 809.8, "total_tokens": 3852752} {"current_steps": 2950, "total_steps": 12855, "loss": 1.0918, "accuracy": 0.800000011920929, "learning_rate": 4.3779620608871526e-05, "epoch": 0.22948269155970438, "percentage": 22.95, "elapsed_time": "1:19:27", "remaining_time": "4:26:49", "throughput": 810.23, "total_tokens": 3863120} {"current_steps": 2960, "total_steps": 12855, "loss": 1.0268, "accuracy": 1.0, "learning_rate": 4.373923512533018e-05, "epoch": 0.23026059898872034, "percentage": 23.03, "elapsed_time": "1:19:42", "remaining_time": "4:26:27", "throughput": 810.56, "total_tokens": 3876384} {"current_steps": 2970, "total_steps": 12855, "loss": 1.0257, "accuracy": 0.8999999761581421, "learning_rate": 4.369873772191092e-05, "epoch": 0.2310385064177363, "percentage": 23.1, "elapsed_time": "1:19:54", "remaining_time": "4:25:57", "throughput": 810.72, "total_tokens": 3887008} {"current_steps": 2980, "total_steps": 12855, "loss": 1.0754, "accuracy": 0.6000000238418579, "learning_rate": 4.365812864048407e-05, "epoch": 0.23181641384675222, "percentage": 23.18, "elapsed_time": "1:20:12", "remaining_time": "4:25:46", "throughput": 810.89, "total_tokens": 3902128} {"current_steps": 2990, "total_steps": 12855, "loss": 1.1817, "accuracy": 0.8999999761581421, "learning_rate": 4.3617408123586913e-05, "epoch": 0.23259432127576818, "percentage": 23.26, "elapsed_time": "1:20:41", "remaining_time": "4:26:14", "throughput": 809.15, "total_tokens": 3917712} {"current_steps": 3000, "total_steps": 12855, "loss": 1.0064, "accuracy": 0.800000011920929, "learning_rate": 4.357657641442229e-05, "epoch": 0.23337222870478413, "percentage": 23.34, "elapsed_time": "1:20:59", "remaining_time": "4:26:02", "throughput": 808.87, "total_tokens": 3930480} {"current_steps": 3010, "total_steps": 12855, "loss": 0.9786, "accuracy": 0.8999999761581421, "learning_rate": 4.3535633756857136e-05, "epoch": 0.2341501361338001, "percentage": 23.42, "elapsed_time": "1:21:21", "remaining_time": "4:26:04", "throughput": 807.1, "total_tokens": 3939456} {"current_steps": 3020, "total_steps": 12855, "loss": 1.1815, "accuracy": 0.8999999761581421, "learning_rate": 4.349458039542105e-05, "epoch": 0.23492804356281602, "percentage": 23.49, "elapsed_time": "1:21:34", "remaining_time": "4:25:38", "throughput": 806.85, "total_tokens": 3948896} {"current_steps": 3030, "total_steps": 12855, "loss": 0.8875, "accuracy": 0.800000011920929, "learning_rate": 4.345341657530476e-05, "epoch": 0.23570595099183198, "percentage": 23.57, "elapsed_time": "1:22:11", "remaining_time": "4:26:29", "throughput": 803.68, "total_tokens": 3963056} {"current_steps": 3040, "total_steps": 12855, "loss": 1.0336, "accuracy": 0.8999999761581421, "learning_rate": 4.3412142542358746e-05, "epoch": 0.23648385842084793, "percentage": 23.65, "elapsed_time": "1:22:25", "remaining_time": "4:26:05", "throughput": 803.55, "total_tokens": 3973632} {"current_steps": 3050, "total_steps": 12855, "loss": 1.0508, "accuracy": 0.800000011920929, "learning_rate": 4.3370758543091735e-05, "epoch": 0.23726176584986386, "percentage": 23.73, "elapsed_time": "1:22:36", "remaining_time": "4:25:34", "throughput": 803.64, "total_tokens": 3983488} {"current_steps": 3060, "total_steps": 12855, "loss": 0.8586, "accuracy": 0.699999988079071, "learning_rate": 4.332926482466919e-05, "epoch": 0.23803967327887982, "percentage": 23.8, "elapsed_time": "1:22:48", "remaining_time": "4:25:04", "throughput": 803.7, "total_tokens": 3993264} {"current_steps": 3070, "total_steps": 12855, "loss": 1.0565, "accuracy": 0.8999999761581421, "learning_rate": 4.32876616349119e-05, "epoch": 0.23881758070789577, "percentage": 23.88, "elapsed_time": "1:23:02", "remaining_time": "4:24:41", "throughput": 804.04, "total_tokens": 4006208} {"current_steps": 3080, "total_steps": 12855, "loss": 1.0042, "accuracy": 0.699999988079071, "learning_rate": 4.3245949222294466e-05, "epoch": 0.2395954881369117, "percentage": 23.96, "elapsed_time": "1:23:17", "remaining_time": "4:24:21", "throughput": 804.3, "total_tokens": 4019776} {"current_steps": 3090, "total_steps": 12855, "loss": 0.9954, "accuracy": 1.0, "learning_rate": 4.320412783594381e-05, "epoch": 0.24037339556592766, "percentage": 24.04, "elapsed_time": "1:23:32", "remaining_time": "4:23:59", "throughput": 804.45, "total_tokens": 4031968} {"current_steps": 3100, "total_steps": 12855, "loss": 0.9118, "accuracy": 0.800000011920929, "learning_rate": 4.316219772563772e-05, "epoch": 0.2411513029949436, "percentage": 24.12, "elapsed_time": "1:23:46", "remaining_time": "4:23:35", "throughput": 804.73, "total_tokens": 4044592} {"current_steps": 3110, "total_steps": 12855, "loss": 0.9622, "accuracy": 0.8999999761581421, "learning_rate": 4.312015914180332e-05, "epoch": 0.24192921042395954, "percentage": 24.19, "elapsed_time": "1:24:03", "remaining_time": "4:23:22", "throughput": 804.28, "total_tokens": 4056096} {"current_steps": 3120, "total_steps": 12855, "loss": 1.0044, "accuracy": 0.699999988079071, "learning_rate": 4.307801233551558e-05, "epoch": 0.2427071178529755, "percentage": 24.27, "elapsed_time": "1:24:20", "remaining_time": "4:23:09", "throughput": 803.92, "total_tokens": 4068272} {"current_steps": 3130, "total_steps": 12855, "loss": 1.1389, "accuracy": 0.8999999761581421, "learning_rate": 4.303575755849587e-05, "epoch": 0.24348502528199145, "percentage": 24.35, "elapsed_time": "1:24:34", "remaining_time": "4:22:47", "throughput": 803.9, "total_tokens": 4079664} {"current_steps": 3140, "total_steps": 12855, "loss": 0.9769, "accuracy": 0.699999988079071, "learning_rate": 4.2993395063110365e-05, "epoch": 0.24426293271100738, "percentage": 24.43, "elapsed_time": "1:24:53", "remaining_time": "4:22:37", "throughput": 803.92, "total_tokens": 4094448} {"current_steps": 3150, "total_steps": 12855, "loss": 1.1078, "accuracy": 0.800000011920929, "learning_rate": 4.2950925102368605e-05, "epoch": 0.24504084014002334, "percentage": 24.5, "elapsed_time": "1:25:09", "remaining_time": "4:22:21", "throughput": 804.09, "total_tokens": 4108192} {"current_steps": 3160, "total_steps": 12855, "loss": 0.8765, "accuracy": 0.800000011920929, "learning_rate": 4.290834792992198e-05, "epoch": 0.2458187475690393, "percentage": 24.58, "elapsed_time": "1:25:52", "remaining_time": "4:23:28", "throughput": 800.97, "total_tokens": 4127088} {"current_steps": 3170, "total_steps": 12855, "loss": 0.9898, "accuracy": 0.8999999761581421, "learning_rate": 4.286566380006218e-05, "epoch": 0.24659665499805522, "percentage": 24.66, "elapsed_time": "1:26:17", "remaining_time": "4:23:39", "throughput": 799.73, "total_tokens": 4140960} {"current_steps": 3180, "total_steps": 12855, "loss": 1.0286, "accuracy": 0.6000000238418579, "learning_rate": 4.282287296771972e-05, "epoch": 0.24737456242707118, "percentage": 24.74, "elapsed_time": "1:26:41", "remaining_time": "4:23:44", "throughput": 799.04, "total_tokens": 4155904} {"current_steps": 3190, "total_steps": 12855, "loss": 0.9598, "accuracy": 0.800000011920929, "learning_rate": 4.277997568846237e-05, "epoch": 0.24815246985608713, "percentage": 24.82, "elapsed_time": "1:27:09", "remaining_time": "4:24:03", "throughput": 798.37, "total_tokens": 4174832} {"current_steps": 3200, "total_steps": 12855, "loss": 1.0203, "accuracy": 0.800000011920929, "learning_rate": 4.2736972218493664e-05, "epoch": 0.24893037728510306, "percentage": 24.89, "elapsed_time": "1:27:35", "remaining_time": "4:24:17", "throughput": 797.46, "total_tokens": 4191232} {"current_steps": 3210, "total_steps": 12855, "loss": 1.0954, "accuracy": 0.6000000238418579, "learning_rate": 4.269386281465136e-05, "epoch": 0.24970828471411902, "percentage": 24.97, "elapsed_time": "1:27:50", "remaining_time": "4:23:57", "throughput": 797.71, "total_tokens": 4204640} {"current_steps": 3220, "total_steps": 12855, "loss": 1.0289, "accuracy": 0.699999988079071, "learning_rate": 4.2650647734405914e-05, "epoch": 0.25048619214313494, "percentage": 25.05, "elapsed_time": "1:28:10", "remaining_time": "4:23:50", "throughput": 797.81, "total_tokens": 4220752} {"current_steps": 3230, "total_steps": 12855, "loss": 0.9947, "accuracy": 0.8999999761581421, "learning_rate": 4.2607327235858894e-05, "epoch": 0.2512640995721509, "percentage": 25.13, "elapsed_time": "1:28:26", "remaining_time": "4:23:32", "throughput": 797.89, "total_tokens": 4233920} {"current_steps": 3240, "total_steps": 12855, "loss": 1.0714, "accuracy": 1.0, "learning_rate": 4.256390157774154e-05, "epoch": 0.25204200700116686, "percentage": 25.2, "elapsed_time": "1:28:37", "remaining_time": "4:23:01", "throughput": 798.05, "total_tokens": 4243920} {"current_steps": 3250, "total_steps": 12855, "loss": 1.0548, "accuracy": 0.6000000238418579, "learning_rate": 4.2520371019413095e-05, "epoch": 0.2528199144301828, "percentage": 25.28, "elapsed_time": "1:28:52", "remaining_time": "4:22:40", "throughput": 798.09, "total_tokens": 4256112} {"current_steps": 3260, "total_steps": 12855, "loss": 1.1476, "accuracy": 0.6000000238418579, "learning_rate": 4.2476735820859374e-05, "epoch": 0.25359782185919877, "percentage": 25.36, "elapsed_time": "1:29:09", "remaining_time": "4:22:24", "throughput": 798.3, "total_tokens": 4270368} {"current_steps": 3270, "total_steps": 12855, "loss": 0.9217, "accuracy": 0.800000011920929, "learning_rate": 4.2432996242691095e-05, "epoch": 0.2543757292882147, "percentage": 25.44, "elapsed_time": "1:29:25", "remaining_time": "4:22:06", "throughput": 798.38, "total_tokens": 4283568} {"current_steps": 3280, "total_steps": 12855, "loss": 1.2814, "accuracy": 0.699999988079071, "learning_rate": 4.238915254614243e-05, "epoch": 0.2551536367172306, "percentage": 25.52, "elapsed_time": "1:29:38", "remaining_time": "4:21:42", "throughput": 798.12, "total_tokens": 4293056} {"current_steps": 3290, "total_steps": 12855, "loss": 0.8583, "accuracy": 0.8999999761581421, "learning_rate": 4.2345204993069376e-05, "epoch": 0.2559315441462466, "percentage": 25.59, "elapsed_time": "1:29:59", "remaining_time": "4:21:37", "throughput": 797.8, "total_tokens": 4307728} {"current_steps": 3300, "total_steps": 12855, "loss": 0.8122, "accuracy": 0.8999999761581421, "learning_rate": 4.230115384594821e-05, "epoch": 0.25670945157526254, "percentage": 25.67, "elapsed_time": "1:30:18", "remaining_time": "4:21:29", "throughput": 797.39, "total_tokens": 4320736} {"current_steps": 3310, "total_steps": 12855, "loss": 0.8513, "accuracy": 0.800000011920929, "learning_rate": 4.225699936787394e-05, "epoch": 0.2574873590042785, "percentage": 25.75, "elapsed_time": "1:30:30", "remaining_time": "4:20:58", "throughput": 797.86, "total_tokens": 4332432} {"current_steps": 3320, "total_steps": 12855, "loss": 1.0142, "accuracy": 0.8999999761581421, "learning_rate": 4.22127418225587e-05, "epoch": 0.25826526643329445, "percentage": 25.83, "elapsed_time": "1:30:48", "remaining_time": "4:20:48", "throughput": 798.12, "total_tokens": 4348576} {"current_steps": 3330, "total_steps": 12855, "loss": 0.8378, "accuracy": 0.800000011920929, "learning_rate": 4.21683814743302e-05, "epoch": 0.2590431738623104, "percentage": 25.9, "elapsed_time": "1:31:03", "remaining_time": "4:20:27", "throughput": 798.31, "total_tokens": 4361584} {"current_steps": 3340, "total_steps": 12855, "loss": 0.9238, "accuracy": 1.0, "learning_rate": 4.212391858813013e-05, "epoch": 0.2598210812913263, "percentage": 25.98, "elapsed_time": "1:31:13", "remaining_time": "4:19:52", "throughput": 798.88, "total_tokens": 4372672} {"current_steps": 3350, "total_steps": 12855, "loss": 1.11, "accuracy": 0.8999999761581421, "learning_rate": 4.207935342951261e-05, "epoch": 0.26059898872034226, "percentage": 26.06, "elapsed_time": "1:31:28", "remaining_time": "4:19:33", "throughput": 798.49, "total_tokens": 4382704} {"current_steps": 3360, "total_steps": 12855, "loss": 0.8993, "accuracy": 0.699999988079071, "learning_rate": 4.203468626464254e-05, "epoch": 0.2613768961493582, "percentage": 26.14, "elapsed_time": "1:31:52", "remaining_time": "4:19:36", "throughput": 797.22, "total_tokens": 4394320} {"current_steps": 3370, "total_steps": 12855, "loss": 1.1625, "accuracy": 0.8999999761581421, "learning_rate": 4.1989917360294106e-05, "epoch": 0.2621548035783742, "percentage": 26.22, "elapsed_time": "1:32:01", "remaining_time": "4:19:01", "throughput": 797.12, "total_tokens": 4401664} {"current_steps": 3380, "total_steps": 12855, "loss": 1.184, "accuracy": 1.0, "learning_rate": 4.194504698384908e-05, "epoch": 0.26293271100739013, "percentage": 26.29, "elapsed_time": "1:32:21", "remaining_time": "4:18:55", "throughput": 796.46, "total_tokens": 4413920} {"current_steps": 3390, "total_steps": 12855, "loss": 0.9663, "accuracy": 0.800000011920929, "learning_rate": 4.1900075403295304e-05, "epoch": 0.2637106184364061, "percentage": 26.37, "elapsed_time": "1:32:37", "remaining_time": "4:18:37", "throughput": 796.12, "total_tokens": 4424784} {"current_steps": 3400, "total_steps": 12855, "loss": 0.7776, "accuracy": 1.0, "learning_rate": 4.185500288722505e-05, "epoch": 0.26448852586542204, "percentage": 26.45, "elapsed_time": "1:32:47", "remaining_time": "4:18:01", "throughput": 796.38, "total_tokens": 4433632} {"current_steps": 3410, "total_steps": 12855, "loss": 0.9434, "accuracy": 0.800000011920929, "learning_rate": 4.180982970483344e-05, "epoch": 0.26526643329443794, "percentage": 26.53, "elapsed_time": "1:33:02", "remaining_time": "4:17:43", "throughput": 796.41, "total_tokens": 4446192} {"current_steps": 3420, "total_steps": 12855, "loss": 0.7579, "accuracy": 0.8999999761581421, "learning_rate": 4.176455612591681e-05, "epoch": 0.2660443407234539, "percentage": 26.6, "elapsed_time": "1:33:16", "remaining_time": "4:17:19", "throughput": 796.33, "total_tokens": 4456784} {"current_steps": 3430, "total_steps": 12855, "loss": 1.0241, "accuracy": 0.8999999761581421, "learning_rate": 4.1719182420871104e-05, "epoch": 0.26682224815246985, "percentage": 26.68, "elapsed_time": "1:33:30", "remaining_time": "4:16:57", "throughput": 796.43, "total_tokens": 4468704} {"current_steps": 3440, "total_steps": 12855, "loss": 0.9317, "accuracy": 0.800000011920929, "learning_rate": 4.16737088606903e-05, "epoch": 0.2676001555814858, "percentage": 26.76, "elapsed_time": "1:33:45", "remaining_time": "4:16:35", "throughput": 796.44, "total_tokens": 4480144} {"current_steps": 3450, "total_steps": 12855, "loss": 0.9583, "accuracy": 0.800000011920929, "learning_rate": 4.1628135716964734e-05, "epoch": 0.26837806301050177, "percentage": 26.84, "elapsed_time": "1:33:59", "remaining_time": "4:16:14", "throughput": 796.74, "total_tokens": 4493504} {"current_steps": 3460, "total_steps": 12855, "loss": 0.9748, "accuracy": 0.800000011920929, "learning_rate": 4.158246326187951e-05, "epoch": 0.2691559704395177, "percentage": 26.92, "elapsed_time": "1:34:20", "remaining_time": "4:16:10", "throughput": 796.25, "total_tokens": 4507200} {"current_steps": 3470, "total_steps": 12855, "loss": 1.2102, "accuracy": 0.8999999761581421, "learning_rate": 4.153669176821288e-05, "epoch": 0.2699338778685336, "percentage": 26.99, "elapsed_time": "1:34:37", "remaining_time": "4:15:56", "throughput": 795.98, "total_tokens": 4519392} {"current_steps": 3480, "total_steps": 12855, "loss": 1.0537, "accuracy": 0.800000011920929, "learning_rate": 4.149082150933456e-05, "epoch": 0.2707117852975496, "percentage": 27.07, "elapsed_time": "1:34:54", "remaining_time": "4:15:41", "throughput": 795.82, "total_tokens": 4531984} {"current_steps": 3490, "total_steps": 12855, "loss": 1.2139, "accuracy": 0.6000000238418579, "learning_rate": 4.144485275920422e-05, "epoch": 0.27148969272656553, "percentage": 27.15, "elapsed_time": "1:35:29", "remaining_time": "4:16:15", "throughput": 793.71, "total_tokens": 4547792} {"current_steps": 3500, "total_steps": 12855, "loss": 1.1075, "accuracy": 0.8999999761581421, "learning_rate": 4.1398785792369676e-05, "epoch": 0.2722676001555815, "percentage": 27.23, "elapsed_time": "1:35:44", "remaining_time": "4:15:55", "throughput": 793.74, "total_tokens": 4560016} {"current_steps": 3510, "total_steps": 12855, "loss": 1.0274, "accuracy": 1.0, "learning_rate": 4.135262088396542e-05, "epoch": 0.27304550758459745, "percentage": 27.3, "elapsed_time": "1:36:01", "remaining_time": "4:15:40", "throughput": 793.76, "total_tokens": 4573536} {"current_steps": 3520, "total_steps": 12855, "loss": 0.931, "accuracy": 0.800000011920929, "learning_rate": 4.130635830971084e-05, "epoch": 0.2738234150136134, "percentage": 27.38, "elapsed_time": "1:36:29", "remaining_time": "4:15:52", "throughput": 793.36, "total_tokens": 4592768} {"current_steps": 3530, "total_steps": 12855, "loss": 1.7911, "accuracy": 0.4000000059604645, "learning_rate": 4.125999834590867e-05, "epoch": 0.2746013224426293, "percentage": 27.46, "elapsed_time": "1:36:38", "remaining_time": "4:15:18", "throughput": 793.68, "total_tokens": 4602480} {"current_steps": 3540, "total_steps": 12855, "loss": 1.0487, "accuracy": 0.8999999761581421, "learning_rate": 4.121354126944329e-05, "epoch": 0.27537922987164526, "percentage": 27.54, "elapsed_time": "1:36:57", "remaining_time": "4:15:08", "throughput": 793.24, "total_tokens": 4614832} {"current_steps": 3550, "total_steps": 12855, "loss": 0.8017, "accuracy": 0.800000011920929, "learning_rate": 4.116698735777907e-05, "epoch": 0.2761571373006612, "percentage": 27.62, "elapsed_time": "1:37:14", "remaining_time": "4:14:53", "throughput": 792.9, "total_tokens": 4626304} {"current_steps": 3560, "total_steps": 12855, "loss": 0.9514, "accuracy": 0.699999988079071, "learning_rate": 4.1120336888958766e-05, "epoch": 0.27693504472967717, "percentage": 27.69, "elapsed_time": "1:37:31", "remaining_time": "4:14:37", "throughput": 792.76, "total_tokens": 4638624} {"current_steps": 3570, "total_steps": 12855, "loss": 1.0792, "accuracy": 1.0, "learning_rate": 4.107359014160177e-05, "epoch": 0.2777129521586931, "percentage": 27.77, "elapsed_time": "1:37:40", "remaining_time": "4:14:02", "throughput": 792.96, "total_tokens": 4647168} {"current_steps": 3580, "total_steps": 12855, "loss": 1.0222, "accuracy": 0.699999988079071, "learning_rate": 4.102674739490254e-05, "epoch": 0.2784908595877091, "percentage": 27.85, "elapsed_time": "1:37:57", "remaining_time": "4:13:46", "throughput": 792.77, "total_tokens": 4659312} {"current_steps": 3590, "total_steps": 12855, "loss": 0.923, "accuracy": 0.8999999761581421, "learning_rate": 4.097980892862886e-05, "epoch": 0.279268767016725, "percentage": 27.93, "elapsed_time": "1:38:20", "remaining_time": "4:13:48", "throughput": 792.25, "total_tokens": 4674992} {"current_steps": 3600, "total_steps": 12855, "loss": 1.0698, "accuracy": 0.8999999761581421, "learning_rate": 4.093277502312022e-05, "epoch": 0.28004667444574094, "percentage": 28.0, "elapsed_time": "1:38:31", "remaining_time": "4:13:17", "throughput": 792.45, "total_tokens": 4684448} {"current_steps": 3610, "total_steps": 12855, "loss": 1.3427, "accuracy": 0.5, "learning_rate": 4.088564595928609e-05, "epoch": 0.2808245818747569, "percentage": 28.08, "elapsed_time": "1:38:43", "remaining_time": "4:12:48", "throughput": 792.73, "total_tokens": 4695472} {"current_steps": 3620, "total_steps": 12855, "loss": 1.1047, "accuracy": 0.8999999761581421, "learning_rate": 4.083842201860431e-05, "epoch": 0.28160248930377285, "percentage": 28.16, "elapsed_time": "1:39:01", "remaining_time": "4:12:36", "throughput": 792.59, "total_tokens": 4708896} {"current_steps": 3630, "total_steps": 12855, "loss": 0.9384, "accuracy": 0.8999999761581421, "learning_rate": 4.079110348311934e-05, "epoch": 0.2823803967327888, "percentage": 28.24, "elapsed_time": "1:39:23", "remaining_time": "4:12:33", "throughput": 792.11, "total_tokens": 4723376} {"current_steps": 3640, "total_steps": 12855, "loss": 0.9396, "accuracy": 0.8999999761581421, "learning_rate": 4.0743690635440634e-05, "epoch": 0.28315830416180476, "percentage": 28.32, "elapsed_time": "1:39:36", "remaining_time": "4:12:09", "throughput": 792.28, "total_tokens": 4734944} {"current_steps": 3650, "total_steps": 12855, "loss": 0.9965, "accuracy": 1.0, "learning_rate": 4.0696183758740894e-05, "epoch": 0.2839362115908207, "percentage": 28.39, "elapsed_time": "1:39:56", "remaining_time": "4:12:02", "throughput": 791.92, "total_tokens": 4748816} {"current_steps": 3660, "total_steps": 12855, "loss": 1.0673, "accuracy": 0.800000011920929, "learning_rate": 4.064858313675443e-05, "epoch": 0.2847141190198366, "percentage": 28.47, "elapsed_time": "1:40:13", "remaining_time": "4:11:47", "throughput": 791.97, "total_tokens": 4762544} {"current_steps": 3670, "total_steps": 12855, "loss": 1.0629, "accuracy": 0.800000011920929, "learning_rate": 4.060088905377543e-05, "epoch": 0.2854920264488526, "percentage": 28.55, "elapsed_time": "1:40:34", "remaining_time": "4:11:43", "throughput": 791.81, "total_tokens": 4778464} {"current_steps": 3680, "total_steps": 12855, "loss": 0.9816, "accuracy": 0.8999999761581421, "learning_rate": 4.05531017946563e-05, "epoch": 0.28626993387786853, "percentage": 28.63, "elapsed_time": "1:40:55", "remaining_time": "4:11:38", "throughput": 791.09, "total_tokens": 4790656} {"current_steps": 3690, "total_steps": 12855, "loss": 1.011, "accuracy": 0.800000011920929, "learning_rate": 4.0505221644805915e-05, "epoch": 0.2870478413068845, "percentage": 28.7, "elapsed_time": "1:41:20", "remaining_time": "4:11:43", "throughput": 789.91, "total_tokens": 4803440} {"current_steps": 3700, "total_steps": 12855, "loss": 0.9823, "accuracy": 0.800000011920929, "learning_rate": 4.045724889018795e-05, "epoch": 0.28782574873590044, "percentage": 28.78, "elapsed_time": "1:41:45", "remaining_time": "4:11:46", "throughput": 789.09, "total_tokens": 4817680} {"current_steps": 3710, "total_steps": 12855, "loss": 1.3073, "accuracy": 0.6000000238418579, "learning_rate": 4.040918381731916e-05, "epoch": 0.2886036561649164, "percentage": 28.86, "elapsed_time": "1:42:04", "remaining_time": "4:11:36", "throughput": 788.79, "total_tokens": 4830976} {"current_steps": 3720, "total_steps": 12855, "loss": 0.8937, "accuracy": 0.8999999761581421, "learning_rate": 4.036102671326768e-05, "epoch": 0.2893815635939323, "percentage": 28.94, "elapsed_time": "1:42:13", "remaining_time": "4:11:02", "throughput": 789.0, "total_tokens": 4839504} {"current_steps": 3730, "total_steps": 12855, "loss": 0.971, "accuracy": 0.699999988079071, "learning_rate": 4.031277786565128e-05, "epoch": 0.29015947102294826, "percentage": 29.02, "elapsed_time": "1:42:29", "remaining_time": "4:10:43", "throughput": 788.96, "total_tokens": 4851552} {"current_steps": 3740, "total_steps": 12855, "loss": 0.8648, "accuracy": 0.6000000238418579, "learning_rate": 4.0264437562635674e-05, "epoch": 0.2909373784519642, "percentage": 29.09, "elapsed_time": "1:42:40", "remaining_time": "4:10:13", "throughput": 789.15, "total_tokens": 4861456} {"current_steps": 3750, "total_steps": 12855, "loss": 0.7778, "accuracy": 0.8999999761581421, "learning_rate": 4.0216006092932815e-05, "epoch": 0.29171528588098017, "percentage": 29.17, "elapsed_time": "1:42:55", "remaining_time": "4:09:54", "throughput": 788.89, "total_tokens": 4872080} {"current_steps": 3760, "total_steps": 12855, "loss": 0.9672, "accuracy": 0.6000000238418579, "learning_rate": 4.01674837457991e-05, "epoch": 0.2924931933099961, "percentage": 29.25, "elapsed_time": "1:43:06", "remaining_time": "4:09:23", "throughput": 789.04, "total_tokens": 4881072} {"current_steps": 3770, "total_steps": 12855, "loss": 0.9834, "accuracy": 0.8999999761581421, "learning_rate": 4.011887081103374e-05, "epoch": 0.2932711007390121, "percentage": 29.33, "elapsed_time": "1:43:19", "remaining_time": "4:08:58", "throughput": 789.02, "total_tokens": 4891296} {"current_steps": 3780, "total_steps": 12855, "loss": 1.0289, "accuracy": 0.6000000238418579, "learning_rate": 4.007016757897696e-05, "epoch": 0.294049008168028, "percentage": 29.4, "elapsed_time": "1:43:39", "remaining_time": "4:08:52", "throughput": 788.5, "total_tokens": 4904416} {"current_steps": 3790, "total_steps": 12855, "loss": 1.0588, "accuracy": 0.8999999761581421, "learning_rate": 4.0021374340508266e-05, "epoch": 0.29482691559704394, "percentage": 29.48, "elapsed_time": "1:43:58", "remaining_time": "4:08:40", "throughput": 788.02, "total_tokens": 4915760} {"current_steps": 3800, "total_steps": 12855, "loss": 1.0018, "accuracy": 0.8999999761581421, "learning_rate": 3.997249138704476e-05, "epoch": 0.2956048230260599, "percentage": 29.56, "elapsed_time": "1:44:13", "remaining_time": "4:08:20", "throughput": 788.18, "total_tokens": 4928688} {"current_steps": 3810, "total_steps": 12855, "loss": 0.9906, "accuracy": 0.699999988079071, "learning_rate": 3.992351901053934e-05, "epoch": 0.29638273045507585, "percentage": 29.64, "elapsed_time": "1:44:29", "remaining_time": "4:08:03", "throughput": 788.42, "total_tokens": 4942880} {"current_steps": 3820, "total_steps": 12855, "loss": 1.1504, "accuracy": 0.8999999761581421, "learning_rate": 3.9874457503479e-05, "epoch": 0.2971606378840918, "percentage": 29.72, "elapsed_time": "1:44:42", "remaining_time": "4:07:38", "throughput": 788.7, "total_tokens": 4954816} {"current_steps": 3830, "total_steps": 12855, "loss": 1.2595, "accuracy": 1.0, "learning_rate": 3.982530715888306e-05, "epoch": 0.29793854531310776, "percentage": 29.79, "elapsed_time": "1:44:53", "remaining_time": "4:07:10", "throughput": 788.99, "total_tokens": 4965600} {"current_steps": 3840, "total_steps": 12855, "loss": 0.7151, "accuracy": 0.8999999761581421, "learning_rate": 3.9776068270301406e-05, "epoch": 0.29871645274212366, "percentage": 29.87, "elapsed_time": "1:45:08", "remaining_time": "4:06:49", "throughput": 788.88, "total_tokens": 4976512} {"current_steps": 3850, "total_steps": 12855, "loss": 0.8862, "accuracy": 0.800000011920929, "learning_rate": 3.972674113181277e-05, "epoch": 0.2994943601711396, "percentage": 29.95, "elapsed_time": "1:45:28", "remaining_time": "4:06:41", "throughput": 788.91, "total_tokens": 4992464} {"current_steps": 3860, "total_steps": 12855, "loss": 0.9586, "accuracy": 1.0, "learning_rate": 3.9677326038022955e-05, "epoch": 0.3002722676001556, "percentage": 30.03, "elapsed_time": "1:45:45", "remaining_time": "4:06:26", "throughput": 789.08, "total_tokens": 5006896} {"current_steps": 3870, "total_steps": 12855, "loss": 0.9902, "accuracy": 0.8999999761581421, "learning_rate": 3.962782328406306e-05, "epoch": 0.30105017502917153, "percentage": 30.11, "elapsed_time": "1:45:55", "remaining_time": "4:05:56", "throughput": 789.28, "total_tokens": 5016528} {"current_steps": 3880, "total_steps": 12855, "loss": 1.0913, "accuracy": 0.800000011920929, "learning_rate": 3.9578233165587755e-05, "epoch": 0.3018280824581875, "percentage": 30.18, "elapsed_time": "1:46:19", "remaining_time": "4:05:56", "throughput": 788.88, "total_tokens": 5032528} {"current_steps": 3890, "total_steps": 12855, "loss": 0.8901, "accuracy": 1.0, "learning_rate": 3.9528555978773476e-05, "epoch": 0.30260598988720344, "percentage": 30.26, "elapsed_time": "1:46:30", "remaining_time": "4:05:28", "throughput": 789.17, "total_tokens": 5043472} {"current_steps": 3900, "total_steps": 12855, "loss": 0.9658, "accuracy": 0.800000011920929, "learning_rate": 3.9478792020316685e-05, "epoch": 0.3033838973162194, "percentage": 30.34, "elapsed_time": "1:46:53", "remaining_time": "4:05:25", "throughput": 789.08, "total_tokens": 5060352} {"current_steps": 3910, "total_steps": 12855, "loss": 0.8534, "accuracy": 1.0, "learning_rate": 3.9428941587432084e-05, "epoch": 0.3041618047452353, "percentage": 30.42, "elapsed_time": "1:47:04", "remaining_time": "4:04:57", "throughput": 789.13, "total_tokens": 5069808} {"current_steps": 3920, "total_steps": 12855, "loss": 0.8767, "accuracy": 1.0, "learning_rate": 3.937900497785083e-05, "epoch": 0.30493971217425125, "percentage": 30.49, "elapsed_time": "1:47:25", "remaining_time": "4:04:50", "throughput": 788.87, "total_tokens": 5084512} {"current_steps": 3930, "total_steps": 12855, "loss": 0.9163, "accuracy": 0.6000000238418579, "learning_rate": 3.93289824898188e-05, "epoch": 0.3057176196032672, "percentage": 30.57, "elapsed_time": "1:47:56", "remaining_time": "4:05:09", "throughput": 788.08, "total_tokens": 5104352} {"current_steps": 3940, "total_steps": 12855, "loss": 0.9711, "accuracy": 0.800000011920929, "learning_rate": 3.9278874422094735e-05, "epoch": 0.30649552703228317, "percentage": 30.65, "elapsed_time": "1:48:08", "remaining_time": "4:04:42", "throughput": 788.37, "total_tokens": 5115648} {"current_steps": 3950, "total_steps": 12855, "loss": 0.9282, "accuracy": 1.0, "learning_rate": 3.9228681073948545e-05, "epoch": 0.3072734344612991, "percentage": 30.73, "elapsed_time": "1:48:53", "remaining_time": "4:05:28", "throughput": 786.5, "total_tokens": 5138352} {"current_steps": 3960, "total_steps": 12855, "loss": 1.1391, "accuracy": 0.6000000238418579, "learning_rate": 3.917840274515945e-05, "epoch": 0.3080513418903151, "percentage": 30.81, "elapsed_time": "1:49:31", "remaining_time": "4:06:01", "throughput": 784.66, "total_tokens": 5156576} {"current_steps": 3970, "total_steps": 12855, "loss": 1.0275, "accuracy": 0.8999999761581421, "learning_rate": 3.9128039736014225e-05, "epoch": 0.308829249319331, "percentage": 30.88, "elapsed_time": "1:49:43", "remaining_time": "4:05:33", "throughput": 784.85, "total_tokens": 5167008} {"current_steps": 3980, "total_steps": 12855, "loss": 1.0453, "accuracy": 0.800000011920929, "learning_rate": 3.907759234730537e-05, "epoch": 0.30960715674834693, "percentage": 30.96, "elapsed_time": "1:49:58", "remaining_time": "4:05:14", "throughput": 784.89, "total_tokens": 5179360} {"current_steps": 3990, "total_steps": 12855, "loss": 1.1037, "accuracy": 0.8999999761581421, "learning_rate": 3.9027060880329394e-05, "epoch": 0.3103850641773629, "percentage": 31.04, "elapsed_time": "1:50:16", "remaining_time": "4:05:00", "throughput": 784.89, "total_tokens": 5193008} {"current_steps": 4000, "total_steps": 12855, "loss": 0.9933, "accuracy": 0.6000000238418579, "learning_rate": 3.897644563688493e-05, "epoch": 0.31116297160637885, "percentage": 31.12, "elapsed_time": "1:50:31", "remaining_time": "4:04:41", "throughput": 784.92, "total_tokens": 5205440} {"current_steps": 4010, "total_steps": 12855, "loss": 1.3451, "accuracy": 0.8999999761581421, "learning_rate": 3.892574691927096e-05, "epoch": 0.3119408790353948, "percentage": 31.19, "elapsed_time": "1:50:51", "remaining_time": "4:04:32", "throughput": 784.46, "total_tokens": 5218096} {"current_steps": 4020, "total_steps": 12855, "loss": 1.3005, "accuracy": 0.8999999761581421, "learning_rate": 3.887496503028501e-05, "epoch": 0.31271878646441076, "percentage": 31.27, "elapsed_time": "1:51:10", "remaining_time": "4:04:19", "throughput": 784.13, "total_tokens": 5230224} {"current_steps": 4030, "total_steps": 12855, "loss": 1.0805, "accuracy": 0.6000000238418579, "learning_rate": 3.88241002732214e-05, "epoch": 0.31349669389342666, "percentage": 31.35, "elapsed_time": "1:51:33", "remaining_time": "4:04:17", "throughput": 783.54, "total_tokens": 5244752} {"current_steps": 4040, "total_steps": 12855, "loss": 1.1504, "accuracy": 0.800000011920929, "learning_rate": 3.87731529518693e-05, "epoch": 0.3142746013224426, "percentage": 31.43, "elapsed_time": "1:51:50", "remaining_time": "4:04:02", "throughput": 783.58, "total_tokens": 5258256} {"current_steps": 4050, "total_steps": 12855, "loss": 1.0416, "accuracy": 0.699999988079071, "learning_rate": 3.8722123370511045e-05, "epoch": 0.31505250875145857, "percentage": 31.51, "elapsed_time": "1:52:02", "remaining_time": "4:03:35", "throughput": 784.02, "total_tokens": 5270784} {"current_steps": 4060, "total_steps": 12855, "loss": 0.8825, "accuracy": 1.0, "learning_rate": 3.8671011833920253e-05, "epoch": 0.3158304161804745, "percentage": 31.58, "elapsed_time": "1:52:18", "remaining_time": "4:03:16", "throughput": 784.15, "total_tokens": 5283760} {"current_steps": 4070, "total_steps": 12855, "loss": 0.656, "accuracy": 0.800000011920929, "learning_rate": 3.8619818647360036e-05, "epoch": 0.3166083236094905, "percentage": 31.66, "elapsed_time": "1:52:32", "remaining_time": "4:02:55", "throughput": 784.11, "total_tokens": 5294784} {"current_steps": 4080, "total_steps": 12855, "loss": 0.8613, "accuracy": 1.0, "learning_rate": 3.856854411658112e-05, "epoch": 0.31738623103850644, "percentage": 31.74, "elapsed_time": "1:52:44", "remaining_time": "4:02:29", "throughput": 784.3, "total_tokens": 5305744} {"current_steps": 4090, "total_steps": 12855, "loss": 0.9306, "accuracy": 0.8999999761581421, "learning_rate": 3.85171885478201e-05, "epoch": 0.31816413846752234, "percentage": 31.82, "elapsed_time": "1:53:03", "remaining_time": "4:02:17", "throughput": 784.17, "total_tokens": 5319440} {"current_steps": 4100, "total_steps": 12855, "loss": 1.4213, "accuracy": 0.699999988079071, "learning_rate": 3.846575224779754e-05, "epoch": 0.3189420458965383, "percentage": 31.89, "elapsed_time": "1:53:21", "remaining_time": "4:02:03", "throughput": 784.03, "total_tokens": 5332400} {"current_steps": 4110, "total_steps": 12855, "loss": 0.9302, "accuracy": 0.800000011920929, "learning_rate": 3.841423552371619e-05, "epoch": 0.31971995332555425, "percentage": 31.97, "elapsed_time": "1:53:39", "remaining_time": "4:01:50", "throughput": 783.83, "total_tokens": 5345552} {"current_steps": 4120, "total_steps": 12855, "loss": 0.8212, "accuracy": 0.8999999761581421, "learning_rate": 3.836263868325911e-05, "epoch": 0.3204978607545702, "percentage": 32.05, "elapsed_time": "1:53:56", "remaining_time": "4:01:34", "throughput": 783.97, "total_tokens": 5359504} {"current_steps": 4130, "total_steps": 12855, "loss": 1.0161, "accuracy": 0.8999999761581421, "learning_rate": 3.831096203458788e-05, "epoch": 0.32127576818358616, "percentage": 32.13, "elapsed_time": "1:54:13", "remaining_time": "4:01:18", "throughput": 784.08, "total_tokens": 5373568} {"current_steps": 4140, "total_steps": 12855, "loss": 1.0337, "accuracy": 0.8999999761581421, "learning_rate": 3.825920588634073e-05, "epoch": 0.3220536756126021, "percentage": 32.21, "elapsed_time": "1:54:24", "remaining_time": "4:00:50", "throughput": 784.2, "total_tokens": 5383136} {"current_steps": 4150, "total_steps": 12855, "loss": 1.0341, "accuracy": 0.8999999761581421, "learning_rate": 3.820737054763068e-05, "epoch": 0.322831583041618, "percentage": 32.28, "elapsed_time": "1:54:43", "remaining_time": "4:00:39", "throughput": 784.07, "total_tokens": 5397440} {"current_steps": 4160, "total_steps": 12855, "loss": 1.0286, "accuracy": 1.0, "learning_rate": 3.8155456328043735e-05, "epoch": 0.323609490470634, "percentage": 32.36, "elapsed_time": "1:54:56", "remaining_time": "4:00:14", "throughput": 784.18, "total_tokens": 5408160} {"current_steps": 4170, "total_steps": 12855, "loss": 0.8184, "accuracy": 0.699999988079071, "learning_rate": 3.8103463537636996e-05, "epoch": 0.32438739789964993, "percentage": 32.44, "elapsed_time": "1:55:09", "remaining_time": "3:59:51", "throughput": 784.24, "total_tokens": 5418992} {"current_steps": 4180, "total_steps": 12855, "loss": 1.1085, "accuracy": 0.699999988079071, "learning_rate": 3.8051392486936844e-05, "epoch": 0.3251653053286659, "percentage": 32.52, "elapsed_time": "1:55:33", "remaining_time": "3:59:48", "throughput": 784.05, "total_tokens": 5435808} {"current_steps": 4190, "total_steps": 12855, "loss": 1.0086, "accuracy": 0.8999999761581421, "learning_rate": 3.799924348693706e-05, "epoch": 0.32594321275768184, "percentage": 32.59, "elapsed_time": "1:55:55", "remaining_time": "3:59:44", "throughput": 783.38, "total_tokens": 5449056} {"current_steps": 4200, "total_steps": 12855, "loss": 1.2011, "accuracy": 0.800000011920929, "learning_rate": 3.794701684909698e-05, "epoch": 0.3267211201866978, "percentage": 32.67, "elapsed_time": "1:56:09", "remaining_time": "3:59:21", "throughput": 783.49, "total_tokens": 5460400} {"current_steps": 4210, "total_steps": 12855, "loss": 0.9318, "accuracy": 0.8999999761581421, "learning_rate": 3.7894712885339634e-05, "epoch": 0.32749902761571376, "percentage": 32.75, "elapsed_time": "1:56:43", "remaining_time": "3:59:40", "throughput": 782.37, "total_tokens": 5478928} {"current_steps": 4220, "total_steps": 12855, "loss": 0.8587, "accuracy": 0.800000011920929, "learning_rate": 3.784233190804988e-05, "epoch": 0.32827693504472966, "percentage": 32.83, "elapsed_time": "1:57:19", "remaining_time": "4:00:05", "throughput": 780.91, "total_tokens": 5497600} {"current_steps": 4230, "total_steps": 12855, "loss": 0.8841, "accuracy": 0.800000011920929, "learning_rate": 3.778987423007252e-05, "epoch": 0.3290548424737456, "percentage": 32.91, "elapsed_time": "1:57:38", "remaining_time": "3:59:52", "throughput": 780.71, "total_tokens": 5510512} {"current_steps": 4240, "total_steps": 12855, "loss": 0.9538, "accuracy": 0.8999999761581421, "learning_rate": 3.7737340164710474e-05, "epoch": 0.32983274990276157, "percentage": 32.98, "elapsed_time": "1:57:53", "remaining_time": "3:59:32", "throughput": 780.81, "total_tokens": 5522992} {"current_steps": 4250, "total_steps": 12855, "loss": 1.0076, "accuracy": 0.800000011920929, "learning_rate": 3.7684730025722884e-05, "epoch": 0.3306106573317775, "percentage": 33.06, "elapsed_time": "1:58:16", "remaining_time": "3:59:29", "throughput": 780.54, "total_tokens": 5539344} {"current_steps": 4260, "total_steps": 12855, "loss": 0.9729, "accuracy": 0.8999999761581421, "learning_rate": 3.7632044127323216e-05, "epoch": 0.3313885647607935, "percentage": 33.14, "elapsed_time": "1:58:39", "remaining_time": "3:59:23", "throughput": 780.32, "total_tokens": 5555152} {"current_steps": 4270, "total_steps": 12855, "loss": 0.9353, "accuracy": 0.800000011920929, "learning_rate": 3.7579282784177436e-05, "epoch": 0.33216647218980944, "percentage": 33.22, "elapsed_time": "1:58:52", "remaining_time": "3:59:01", "throughput": 780.35, "total_tokens": 5566192} {"current_steps": 4280, "total_steps": 12855, "loss": 0.7786, "accuracy": 0.8999999761581421, "learning_rate": 3.7526446311402095e-05, "epoch": 0.33294437961882534, "percentage": 33.29, "elapsed_time": "1:59:13", "remaining_time": "3:58:51", "throughput": 780.13, "total_tokens": 5580640} {"current_steps": 4290, "total_steps": 12855, "loss": 0.9205, "accuracy": 0.699999988079071, "learning_rate": 3.7473535024562446e-05, "epoch": 0.3337222870478413, "percentage": 33.37, "elapsed_time": "1:59:26", "remaining_time": "3:58:28", "throughput": 780.19, "total_tokens": 5591376} {"current_steps": 4300, "total_steps": 12855, "loss": 0.8458, "accuracy": 0.800000011920929, "learning_rate": 3.742054923967057e-05, "epoch": 0.33450019447685725, "percentage": 33.45, "elapsed_time": "1:59:51", "remaining_time": "3:58:27", "throughput": 779.63, "total_tokens": 5606752} {"current_steps": 4310, "total_steps": 12855, "loss": 0.7059, "accuracy": 0.8999999761581421, "learning_rate": 3.7367489273183495e-05, "epoch": 0.3352781019058732, "percentage": 33.53, "elapsed_time": "2:00:09", "remaining_time": "3:58:12", "throughput": 779.41, "total_tokens": 5618800} {"current_steps": 4320, "total_steps": 12855, "loss": 1.079, "accuracy": 0.8999999761581421, "learning_rate": 3.7314355442001294e-05, "epoch": 0.33605600933488916, "percentage": 33.61, "elapsed_time": "2:00:27", "remaining_time": "3:57:58", "throughput": 779.05, "total_tokens": 5630448} {"current_steps": 4330, "total_steps": 12855, "loss": 0.9621, "accuracy": 0.8999999761581421, "learning_rate": 3.726114806346518e-05, "epoch": 0.3368339167639051, "percentage": 33.68, "elapsed_time": "2:00:43", "remaining_time": "3:57:41", "throughput": 779.12, "total_tokens": 5643584} {"current_steps": 4340, "total_steps": 12855, "loss": 1.0142, "accuracy": 0.8999999761581421, "learning_rate": 3.720786745535568e-05, "epoch": 0.337611824192921, "percentage": 33.76, "elapsed_time": "2:00:58", "remaining_time": "3:57:21", "throughput": 779.26, "total_tokens": 5656624} {"current_steps": 4350, "total_steps": 12855, "loss": 0.9231, "accuracy": 0.699999988079071, "learning_rate": 3.7154513935890614e-05, "epoch": 0.338389731621937, "percentage": 33.84, "elapsed_time": "2:01:12", "remaining_time": "3:56:58", "throughput": 779.24, "total_tokens": 5666960} {"current_steps": 4360, "total_steps": 12855, "loss": 1.18, "accuracy": 0.699999988079071, "learning_rate": 3.710108782372331e-05, "epoch": 0.33916763905095293, "percentage": 33.92, "elapsed_time": "2:01:31", "remaining_time": "3:56:46", "throughput": 778.92, "total_tokens": 5679232} {"current_steps": 4370, "total_steps": 12855, "loss": 0.9895, "accuracy": 0.699999988079071, "learning_rate": 3.7047589437940636e-05, "epoch": 0.3399455464799689, "percentage": 33.99, "elapsed_time": "2:01:47", "remaining_time": "3:56:29", "throughput": 778.69, "total_tokens": 5690656} {"current_steps": 4380, "total_steps": 12855, "loss": 0.9972, "accuracy": 0.6000000238418579, "learning_rate": 3.6994019098061123e-05, "epoch": 0.34072345390898484, "percentage": 34.07, "elapsed_time": "2:02:05", "remaining_time": "3:56:13", "throughput": 778.44, "total_tokens": 5702304} {"current_steps": 4390, "total_steps": 12855, "loss": 0.9975, "accuracy": 0.6000000238418579, "learning_rate": 3.6940377124033033e-05, "epoch": 0.3415013613380008, "percentage": 34.15, "elapsed_time": "2:02:16", "remaining_time": "3:55:46", "throughput": 778.74, "total_tokens": 5713360} {"current_steps": 4400, "total_steps": 12855, "loss": 1.1692, "accuracy": 0.4000000059604645, "learning_rate": 3.688666383623249e-05, "epoch": 0.3422792687670167, "percentage": 34.23, "elapsed_time": "2:02:34", "remaining_time": "3:55:31", "throughput": 778.87, "total_tokens": 5728016} {"current_steps": 4410, "total_steps": 12855, "loss": 0.9998, "accuracy": 1.0, "learning_rate": 3.6832879555461507e-05, "epoch": 0.34305717619603265, "percentage": 34.31, "elapsed_time": "2:02:51", "remaining_time": "3:55:16", "throughput": 779.03, "total_tokens": 5742624} {"current_steps": 4420, "total_steps": 12855, "loss": 0.9744, "accuracy": 0.8999999761581421, "learning_rate": 3.677902460294612e-05, "epoch": 0.3438350836250486, "percentage": 34.38, "elapsed_time": "2:03:08", "remaining_time": "3:55:00", "throughput": 779.13, "total_tokens": 5756800} {"current_steps": 4430, "total_steps": 12855, "loss": 0.9084, "accuracy": 1.0, "learning_rate": 3.6725099300334446e-05, "epoch": 0.34461299105406457, "percentage": 34.46, "elapsed_time": "2:03:19", "remaining_time": "3:54:32", "throughput": 779.69, "total_tokens": 5769152} {"current_steps": 4440, "total_steps": 12855, "loss": 1.0324, "accuracy": 1.0, "learning_rate": 3.667110396969477e-05, "epoch": 0.3453908984830805, "percentage": 34.54, "elapsed_time": "2:03:41", "remaining_time": "3:54:26", "throughput": 779.67, "total_tokens": 5786576} {"current_steps": 4450, "total_steps": 12855, "loss": 0.9945, "accuracy": 0.8999999761581421, "learning_rate": 3.661703893351361e-05, "epoch": 0.3461688059120965, "percentage": 34.62, "elapsed_time": "2:03:56", "remaining_time": "3:54:05", "throughput": 779.89, "total_tokens": 5799632} {"current_steps": 4460, "total_steps": 12855, "loss": 0.8456, "accuracy": 1.0, "learning_rate": 3.656290451469382e-05, "epoch": 0.34694671334111243, "percentage": 34.69, "elapsed_time": "2:04:08", "remaining_time": "3:53:40", "throughput": 780.14, "total_tokens": 5811184} {"current_steps": 4470, "total_steps": 12855, "loss": 0.9886, "accuracy": 0.800000011920929, "learning_rate": 3.6508701036552624e-05, "epoch": 0.34772462077012833, "percentage": 34.77, "elapsed_time": "2:04:22", "remaining_time": "3:53:18", "throughput": 780.35, "total_tokens": 5823296} {"current_steps": 4480, "total_steps": 12855, "loss": 1.1549, "accuracy": 0.800000011920929, "learning_rate": 3.6454428822819695e-05, "epoch": 0.3485025281991443, "percentage": 34.85, "elapsed_time": "2:04:37", "remaining_time": "3:52:59", "throughput": 780.55, "total_tokens": 5836768} {"current_steps": 4490, "total_steps": 12855, "loss": 1.2687, "accuracy": 0.6000000238418579, "learning_rate": 3.640008819763525e-05, "epoch": 0.34928043562816025, "percentage": 34.93, "elapsed_time": "2:04:50", "remaining_time": "3:52:35", "throughput": 780.65, "total_tokens": 5847728} {"current_steps": 4500, "total_steps": 12855, "loss": 1.0606, "accuracy": 0.800000011920929, "learning_rate": 3.634567948554807e-05, "epoch": 0.3500583430571762, "percentage": 35.01, "elapsed_time": "2:05:07", "remaining_time": "3:52:18", "throughput": 780.84, "total_tokens": 5861776} {"current_steps": 4510, "total_steps": 12855, "loss": 1.0608, "accuracy": 1.0, "learning_rate": 3.62912030115136e-05, "epoch": 0.35083625048619216, "percentage": 35.08, "elapsed_time": "2:05:19", "remaining_time": "3:51:53", "throughput": 781.0, "total_tokens": 5872640} {"current_steps": 4520, "total_steps": 12855, "loss": 1.0176, "accuracy": 1.0, "learning_rate": 3.6236659100892e-05, "epoch": 0.3516141579152081, "percentage": 35.16, "elapsed_time": "2:05:47", "remaining_time": "3:51:57", "throughput": 780.67, "total_tokens": 5892208} {"current_steps": 4530, "total_steps": 12855, "loss": 0.8963, "accuracy": 0.699999988079071, "learning_rate": 3.618204807944617e-05, "epoch": 0.352392065344224, "percentage": 35.24, "elapsed_time": "2:05:58", "remaining_time": "3:51:30", "throughput": 780.99, "total_tokens": 5903216} {"current_steps": 4540, "total_steps": 12855, "loss": 0.921, "accuracy": 1.0, "learning_rate": 3.612737027333984e-05, "epoch": 0.35316997277323997, "percentage": 35.32, "elapsed_time": "2:06:16", "remaining_time": "3:51:15", "throughput": 781.22, "total_tokens": 5918576} {"current_steps": 4550, "total_steps": 12855, "loss": 0.8021, "accuracy": 1.0, "learning_rate": 3.607262600913563e-05, "epoch": 0.3539478802022559, "percentage": 35.39, "elapsed_time": "2:06:34", "remaining_time": "3:51:02", "throughput": 780.95, "total_tokens": 5931248} {"current_steps": 4560, "total_steps": 12855, "loss": 1.1528, "accuracy": 0.6000000238418579, "learning_rate": 3.601781561379304e-05, "epoch": 0.3547257876312719, "percentage": 35.47, "elapsed_time": "2:06:52", "remaining_time": "3:50:47", "throughput": 780.99, "total_tokens": 5945392} {"current_steps": 4570, "total_steps": 12855, "loss": 0.8622, "accuracy": 0.8999999761581421, "learning_rate": 3.596293941466658e-05, "epoch": 0.35550369506028784, "percentage": 35.55, "elapsed_time": "2:07:03", "remaining_time": "3:50:20", "throughput": 781.33, "total_tokens": 5956272} {"current_steps": 4580, "total_steps": 12855, "loss": 0.811, "accuracy": 0.8999999761581421, "learning_rate": 3.5907997739503735e-05, "epoch": 0.3562816024893038, "percentage": 35.63, "elapsed_time": "2:07:15", "remaining_time": "3:49:56", "throughput": 781.66, "total_tokens": 5968640} {"current_steps": 4590, "total_steps": 12855, "loss": 0.9329, "accuracy": 0.800000011920929, "learning_rate": 3.585299091644307e-05, "epoch": 0.3570595099183197, "percentage": 35.71, "elapsed_time": "2:07:26", "remaining_time": "3:49:28", "throughput": 781.79, "total_tokens": 5977824} {"current_steps": 4600, "total_steps": 12855, "loss": 1.056, "accuracy": 0.8999999761581421, "learning_rate": 3.5797919274012235e-05, "epoch": 0.35783741734733565, "percentage": 35.78, "elapsed_time": "2:07:33", "remaining_time": "3:48:54", "throughput": 782.11, "total_tokens": 5985584} {"current_steps": 4610, "total_steps": 12855, "loss": 0.9462, "accuracy": 0.699999988079071, "learning_rate": 3.5742783141126016e-05, "epoch": 0.3586153247763516, "percentage": 35.86, "elapsed_time": "2:07:48", "remaining_time": "3:48:35", "throughput": 782.32, "total_tokens": 5999360} {"current_steps": 4620, "total_steps": 12855, "loss": 0.8354, "accuracy": 0.8999999761581421, "learning_rate": 3.568758284708437e-05, "epoch": 0.35939323220536756, "percentage": 35.94, "elapsed_time": "2:08:00", "remaining_time": "3:48:10", "throughput": 782.51, "total_tokens": 6010208} {"current_steps": 4630, "total_steps": 12855, "loss": 1.0469, "accuracy": 1.0, "learning_rate": 3.563231872157045e-05, "epoch": 0.3601711396343835, "percentage": 36.02, "elapsed_time": "2:08:13", "remaining_time": "3:47:47", "throughput": 782.67, "total_tokens": 6021760} {"current_steps": 4640, "total_steps": 12855, "loss": 0.8721, "accuracy": 1.0, "learning_rate": 3.557699109464865e-05, "epoch": 0.3609490470633995, "percentage": 36.09, "elapsed_time": "2:08:34", "remaining_time": "3:47:38", "throughput": 782.55, "total_tokens": 6036992} {"current_steps": 4650, "total_steps": 12855, "loss": 0.9025, "accuracy": 0.699999988079071, "learning_rate": 3.55216002967626e-05, "epoch": 0.3617269544924154, "percentage": 36.17, "elapsed_time": "2:08:46", "remaining_time": "3:47:14", "throughput": 782.73, "total_tokens": 6048112} {"current_steps": 4660, "total_steps": 12855, "loss": 1.0348, "accuracy": 0.800000011920929, "learning_rate": 3.546614665873326e-05, "epoch": 0.36250486192143133, "percentage": 36.25, "elapsed_time": "2:09:05", "remaining_time": "3:47:00", "throughput": 783.01, "total_tokens": 6064512} {"current_steps": 4670, "total_steps": 12855, "loss": 1.0076, "accuracy": 0.8999999761581421, "learning_rate": 3.5410630511756874e-05, "epoch": 0.3632827693504473, "percentage": 36.33, "elapsed_time": "2:09:33", "remaining_time": "3:47:04", "throughput": 782.55, "total_tokens": 6083280} {"current_steps": 4680, "total_steps": 12855, "loss": 0.9727, "accuracy": 0.699999988079071, "learning_rate": 3.535505218740303e-05, "epoch": 0.36406067677946324, "percentage": 36.41, "elapsed_time": "2:09:51", "remaining_time": "3:46:49", "throughput": 782.74, "total_tokens": 6098496} {"current_steps": 4690, "total_steps": 12855, "loss": 0.8889, "accuracy": 1.0, "learning_rate": 3.529941201761264e-05, "epoch": 0.3648385842084792, "percentage": 36.48, "elapsed_time": "2:10:07", "remaining_time": "3:46:31", "throughput": 782.76, "total_tokens": 6111008} {"current_steps": 4700, "total_steps": 12855, "loss": 0.9603, "accuracy": 0.6000000238418579, "learning_rate": 3.5243710334696047e-05, "epoch": 0.36561649163749516, "percentage": 36.56, "elapsed_time": "2:10:23", "remaining_time": "3:46:14", "throughput": 782.71, "total_tokens": 6123424} {"current_steps": 4710, "total_steps": 12855, "loss": 0.9565, "accuracy": 0.8999999761581421, "learning_rate": 3.5187947471330925e-05, "epoch": 0.3663943990665111, "percentage": 36.64, "elapsed_time": "2:10:41", "remaining_time": "3:46:00", "throughput": 782.78, "total_tokens": 6138416} {"current_steps": 4720, "total_steps": 12855, "loss": 0.9693, "accuracy": 0.800000011920929, "learning_rate": 3.5132123760560375e-05, "epoch": 0.367172306495527, "percentage": 36.72, "elapsed_time": "2:11:00", "remaining_time": "3:45:48", "throughput": 782.75, "total_tokens": 6153056} {"current_steps": 4730, "total_steps": 12855, "loss": 1.049, "accuracy": 0.800000011920929, "learning_rate": 3.507623953579091e-05, "epoch": 0.36795021392454297, "percentage": 36.8, "elapsed_time": "2:11:10", "remaining_time": "3:45:19", "throughput": 782.89, "total_tokens": 6161680} {"current_steps": 4740, "total_steps": 12855, "loss": 0.9243, "accuracy": 0.699999988079071, "learning_rate": 3.502029513079043e-05, "epoch": 0.3687281213535589, "percentage": 36.87, "elapsed_time": "2:11:34", "remaining_time": "3:45:16", "throughput": 782.82, "total_tokens": 6180208} {"current_steps": 4750, "total_steps": 12855, "loss": 0.7439, "accuracy": 0.8999999761581421, "learning_rate": 3.496429087968631e-05, "epoch": 0.3695060287825749, "percentage": 36.95, "elapsed_time": "2:11:47", "remaining_time": "3:44:53", "throughput": 783.0, "total_tokens": 6191808} {"current_steps": 4760, "total_steps": 12855, "loss": 0.9078, "accuracy": 0.8999999761581421, "learning_rate": 3.490822711696333e-05, "epoch": 0.37028393621159084, "percentage": 37.03, "elapsed_time": "2:12:04", "remaining_time": "3:44:36", "throughput": 783.17, "total_tokens": 6206112} {"current_steps": 4770, "total_steps": 12855, "loss": 1.0323, "accuracy": 0.800000011920929, "learning_rate": 3.4852104177461685e-05, "epoch": 0.3710618436406068, "percentage": 37.11, "elapsed_time": "2:12:45", "remaining_time": "3:45:00", "throughput": 781.37, "total_tokens": 6223760} {"current_steps": 4780, "total_steps": 12855, "loss": 0.8294, "accuracy": 0.6000000238418579, "learning_rate": 3.4795922396375034e-05, "epoch": 0.3718397510696227, "percentage": 37.18, "elapsed_time": "2:12:55", "remaining_time": "3:44:33", "throughput": 781.45, "total_tokens": 6232512} {"current_steps": 4790, "total_steps": 12855, "loss": 0.9189, "accuracy": 1.0, "learning_rate": 3.473968210924845e-05, "epoch": 0.37261765849863865, "percentage": 37.26, "elapsed_time": "2:13:20", "remaining_time": "3:44:29", "throughput": 781.27, "total_tokens": 6250160} {"current_steps": 4800, "total_steps": 12855, "loss": 0.9124, "accuracy": 0.8999999761581421, "learning_rate": 3.468338365197643e-05, "epoch": 0.3733955659276546, "percentage": 37.34, "elapsed_time": "2:13:35", "remaining_time": "3:44:10", "throughput": 781.35, "total_tokens": 6262560} {"current_steps": 4810, "total_steps": 12855, "loss": 0.9097, "accuracy": 0.800000011920929, "learning_rate": 3.4627027360800914e-05, "epoch": 0.37417347335667056, "percentage": 37.42, "elapsed_time": "2:13:52", "remaining_time": "3:43:55", "throughput": 781.41, "total_tokens": 6276928} {"current_steps": 4820, "total_steps": 12855, "loss": 0.9624, "accuracy": 0.800000011920929, "learning_rate": 3.457061357230922e-05, "epoch": 0.3749513807856865, "percentage": 37.5, "elapsed_time": "2:14:13", "remaining_time": "3:43:44", "throughput": 781.56, "total_tokens": 6293984} {"current_steps": 4830, "total_steps": 12855, "loss": 1.0058, "accuracy": 0.8999999761581421, "learning_rate": 3.451414262343209e-05, "epoch": 0.3757292882147025, "percentage": 37.57, "elapsed_time": "2:14:32", "remaining_time": "3:43:32", "throughput": 781.65, "total_tokens": 6309888} {"current_steps": 4840, "total_steps": 12855, "loss": 1.0167, "accuracy": 0.800000011920929, "learning_rate": 3.4457614851441664e-05, "epoch": 0.3765071956437184, "percentage": 37.65, "elapsed_time": "2:14:41", "remaining_time": "3:43:02", "throughput": 781.98, "total_tokens": 6319312} {"current_steps": 4850, "total_steps": 12855, "loss": 1.0703, "accuracy": 0.800000011920929, "learning_rate": 3.440103059394942e-05, "epoch": 0.37728510307273433, "percentage": 37.73, "elapsed_time": "2:14:54", "remaining_time": "3:42:40", "throughput": 782.12, "total_tokens": 6331040} {"current_steps": 4860, "total_steps": 12855, "loss": 1.1907, "accuracy": 1.0, "learning_rate": 3.434439018890425e-05, "epoch": 0.3780630105017503, "percentage": 37.81, "elapsed_time": "2:15:12", "remaining_time": "3:42:25", "throughput": 782.2, "total_tokens": 6345360} {"current_steps": 4870, "total_steps": 12855, "loss": 1.2152, "accuracy": 0.8999999761581421, "learning_rate": 3.428769397459034e-05, "epoch": 0.37884091793076624, "percentage": 37.88, "elapsed_time": "2:15:27", "remaining_time": "3:42:05", "throughput": 782.4, "total_tokens": 6358656} {"current_steps": 4880, "total_steps": 12855, "loss": 1.0262, "accuracy": 1.0, "learning_rate": 3.423094228962522e-05, "epoch": 0.3796188253597822, "percentage": 37.96, "elapsed_time": "2:15:44", "remaining_time": "3:41:50", "throughput": 782.5, "total_tokens": 6373184} {"current_steps": 4890, "total_steps": 12855, "loss": 0.6428, "accuracy": 0.8999999761581421, "learning_rate": 3.41741354729577e-05, "epoch": 0.38039673278879815, "percentage": 38.04, "elapsed_time": "2:16:07", "remaining_time": "3:41:42", "throughput": 782.17, "total_tokens": 6388032} {"current_steps": 4900, "total_steps": 12855, "loss": 0.9343, "accuracy": 0.8999999761581421, "learning_rate": 3.411727386386589e-05, "epoch": 0.38117464021781405, "percentage": 38.12, "elapsed_time": "2:16:30", "remaining_time": "3:41:37", "throughput": 782.11, "total_tokens": 6406128} {"current_steps": 4910, "total_steps": 12855, "loss": 0.8708, "accuracy": 1.0, "learning_rate": 3.406035780195512e-05, "epoch": 0.38195254764683, "percentage": 38.2, "elapsed_time": "2:16:44", "remaining_time": "3:41:16", "throughput": 782.14, "total_tokens": 6417088} {"current_steps": 4920, "total_steps": 12855, "loss": 1.0928, "accuracy": 0.6000000238418579, "learning_rate": 3.400338762715595e-05, "epoch": 0.38273045507584597, "percentage": 38.27, "elapsed_time": "2:17:06", "remaining_time": "3:41:08", "throughput": 781.83, "total_tokens": 6432048} {"current_steps": 4930, "total_steps": 12855, "loss": 0.8965, "accuracy": 0.6000000238418579, "learning_rate": 3.394636367972214e-05, "epoch": 0.3835083625048619, "percentage": 38.35, "elapsed_time": "2:17:21", "remaining_time": "3:40:47", "throughput": 781.99, "total_tokens": 6444384} {"current_steps": 4940, "total_steps": 12855, "loss": 0.9343, "accuracy": 0.800000011920929, "learning_rate": 3.388928630022858e-05, "epoch": 0.3842862699338779, "percentage": 38.43, "elapsed_time": "2:17:38", "remaining_time": "3:40:32", "throughput": 782.07, "total_tokens": 6458848} {"current_steps": 4950, "total_steps": 12855, "loss": 0.7843, "accuracy": 0.800000011920929, "learning_rate": 3.383215582956931e-05, "epoch": 0.38506417736289383, "percentage": 38.51, "elapsed_time": "2:17:55", "remaining_time": "3:40:15", "throughput": 782.16, "total_tokens": 6472848} {"current_steps": 4960, "total_steps": 12855, "loss": 0.817, "accuracy": 1.0, "learning_rate": 3.377497260895545e-05, "epoch": 0.3858420847919098, "percentage": 38.58, "elapsed_time": "2:18:16", "remaining_time": "3:40:05", "throughput": 782.19, "total_tokens": 6489472} {"current_steps": 4970, "total_steps": 12855, "loss": 1.0363, "accuracy": 0.699999988079071, "learning_rate": 3.371773697991315e-05, "epoch": 0.3866199922209257, "percentage": 38.66, "elapsed_time": "2:18:34", "remaining_time": "3:39:51", "throughput": 782.32, "total_tokens": 6504976} {"current_steps": 4980, "total_steps": 12855, "loss": 1.0743, "accuracy": 0.8999999761581421, "learning_rate": 3.366044928428158e-05, "epoch": 0.38739789964994165, "percentage": 38.74, "elapsed_time": "2:18:47", "remaining_time": "3:39:27", "throughput": 782.57, "total_tokens": 6516480} {"current_steps": 4990, "total_steps": 12855, "loss": 0.7821, "accuracy": 0.8999999761581421, "learning_rate": 3.3603109864210885e-05, "epoch": 0.3881758070789576, "percentage": 38.82, "elapsed_time": "2:19:00", "remaining_time": "3:39:05", "throughput": 782.66, "total_tokens": 6527696} {"current_steps": 5000, "total_steps": 12855, "loss": 0.8372, "accuracy": 0.8999999761581421, "learning_rate": 3.354571906216013e-05, "epoch": 0.38895371450797356, "percentage": 38.9, "elapsed_time": "2:19:12", "remaining_time": "3:38:42", "throughput": 782.85, "total_tokens": 6539104} {"current_steps": 5010, "total_steps": 12855, "loss": 0.8656, "accuracy": 0.8999999761581421, "learning_rate": 3.3488277220895255e-05, "epoch": 0.3897316219369895, "percentage": 38.97, "elapsed_time": "2:19:33", "remaining_time": "3:38:31", "throughput": 782.45, "total_tokens": 6551712} {"current_steps": 5020, "total_steps": 12855, "loss": 1.2445, "accuracy": 1.0, "learning_rate": 3.343078468348703e-05, "epoch": 0.39050952936600547, "percentage": 39.05, "elapsed_time": "2:19:53", "remaining_time": "3:38:19", "throughput": 782.63, "total_tokens": 6568784} {"current_steps": 5030, "total_steps": 12855, "loss": 0.7005, "accuracy": 1.0, "learning_rate": 3.337324179330901e-05, "epoch": 0.39128743679502137, "percentage": 39.13, "elapsed_time": "2:20:10", "remaining_time": "3:38:04", "throughput": 782.71, "total_tokens": 6583136} {"current_steps": 5040, "total_steps": 12855, "loss": 1.0596, "accuracy": 1.0, "learning_rate": 3.331564889403547e-05, "epoch": 0.3920653442240373, "percentage": 39.21, "elapsed_time": "2:20:26", "remaining_time": "3:37:45", "throughput": 782.83, "total_tokens": 6596496} {"current_steps": 5050, "total_steps": 12855, "loss": 0.9209, "accuracy": 0.8999999761581421, "learning_rate": 3.3258006329639394e-05, "epoch": 0.3928432516530533, "percentage": 39.28, "elapsed_time": "2:20:45", "remaining_time": "3:37:33", "throughput": 782.71, "total_tokens": 6610672} {"current_steps": 5060, "total_steps": 12855, "loss": 1.0244, "accuracy": 0.8999999761581421, "learning_rate": 3.320031444439036e-05, "epoch": 0.39362115908206924, "percentage": 39.36, "elapsed_time": "2:21:05", "remaining_time": "3:37:21", "throughput": 782.75, "total_tokens": 6626704} {"current_steps": 5070, "total_steps": 12855, "loss": 0.8377, "accuracy": 0.8999999761581421, "learning_rate": 3.314257358285253e-05, "epoch": 0.3943990665110852, "percentage": 39.44, "elapsed_time": "2:21:38", "remaining_time": "3:37:29", "throughput": 781.8, "total_tokens": 6644080} {"current_steps": 5080, "total_steps": 12855, "loss": 0.9787, "accuracy": 1.0, "learning_rate": 3.308478408988256e-05, "epoch": 0.39517697394010115, "percentage": 39.52, "elapsed_time": "2:21:52", "remaining_time": "3:37:09", "throughput": 781.92, "total_tokens": 6656352} {"current_steps": 5090, "total_steps": 12855, "loss": 0.8558, "accuracy": 0.8999999761581421, "learning_rate": 3.3026946310627575e-05, "epoch": 0.39595488136911705, "percentage": 39.6, "elapsed_time": "2:22:11", "remaining_time": "3:36:54", "throughput": 781.98, "total_tokens": 6671216} {"current_steps": 5100, "total_steps": 12855, "loss": 0.9509, "accuracy": 0.8999999761581421, "learning_rate": 3.296906059052308e-05, "epoch": 0.396732788798133, "percentage": 39.67, "elapsed_time": "2:22:28", "remaining_time": "3:36:38", "throughput": 782.17, "total_tokens": 6686496} {"current_steps": 5110, "total_steps": 12855, "loss": 0.9321, "accuracy": 1.0, "learning_rate": 3.2911127275290923e-05, "epoch": 0.39751069622714896, "percentage": 39.75, "elapsed_time": "2:22:39", "remaining_time": "3:36:13", "throughput": 782.35, "total_tokens": 6696800} {"current_steps": 5120, "total_steps": 12855, "loss": 0.8923, "accuracy": 0.800000011920929, "learning_rate": 3.285314671093717e-05, "epoch": 0.3982886036561649, "percentage": 39.83, "elapsed_time": "2:23:00", "remaining_time": "3:36:02", "throughput": 782.21, "total_tokens": 6711424} {"current_steps": 5130, "total_steps": 12855, "loss": 0.9994, "accuracy": 0.8999999761581421, "learning_rate": 3.279511924375014e-05, "epoch": 0.3990665110851809, "percentage": 39.91, "elapsed_time": "2:23:12", "remaining_time": "3:35:38", "throughput": 782.3, "total_tokens": 6721808} {"current_steps": 5140, "total_steps": 12855, "loss": 0.9936, "accuracy": 1.0, "learning_rate": 3.273704522029824e-05, "epoch": 0.39984441851419683, "percentage": 39.98, "elapsed_time": "2:23:34", "remaining_time": "3:35:30", "throughput": 782.25, "total_tokens": 6738656} {"current_steps": 5150, "total_steps": 12855, "loss": 1.35, "accuracy": 0.8999999761581421, "learning_rate": 3.2678924987427935e-05, "epoch": 0.40062232594321273, "percentage": 40.06, "elapsed_time": "2:23:45", "remaining_time": "3:35:05", "throughput": 782.37, "total_tokens": 6748608} {"current_steps": 5160, "total_steps": 12855, "loss": 1.3293, "accuracy": 0.8999999761581421, "learning_rate": 3.2620758892261684e-05, "epoch": 0.4014002333722287, "percentage": 40.14, "elapsed_time": "2:23:56", "remaining_time": "3:34:39", "throughput": 782.6, "total_tokens": 6759200} {"current_steps": 5170, "total_steps": 12855, "loss": 0.8285, "accuracy": 1.0, "learning_rate": 3.2562547282195864e-05, "epoch": 0.40217814080124464, "percentage": 40.22, "elapsed_time": "2:24:13", "remaining_time": "3:34:23", "throughput": 782.8, "total_tokens": 6774192} {"current_steps": 5180, "total_steps": 12855, "loss": 0.9387, "accuracy": 1.0, "learning_rate": 3.250429050489868e-05, "epoch": 0.4029560482302606, "percentage": 40.3, "elapsed_time": "2:24:26", "remaining_time": "3:34:01", "throughput": 782.96, "total_tokens": 6785632} {"current_steps": 5190, "total_steps": 12855, "loss": 1.1392, "accuracy": 1.0, "learning_rate": 3.244598890830811e-05, "epoch": 0.40373395565927656, "percentage": 40.37, "elapsed_time": "2:24:39", "remaining_time": "3:33:38", "throughput": 783.1, "total_tokens": 6796816} {"current_steps": 5200, "total_steps": 12855, "loss": 1.0181, "accuracy": 0.8999999761581421, "learning_rate": 3.2387642840629795e-05, "epoch": 0.4045118630882925, "percentage": 40.45, "elapsed_time": "2:24:49", "remaining_time": "3:33:12", "throughput": 783.42, "total_tokens": 6807600} {"current_steps": 5210, "total_steps": 12855, "loss": 1.2985, "accuracy": 1.0, "learning_rate": 3.232925265033499e-05, "epoch": 0.40528977051730847, "percentage": 40.53, "elapsed_time": "2:25:02", "remaining_time": "3:32:49", "throughput": 783.49, "total_tokens": 6818256} {"current_steps": 5220, "total_steps": 12855, "loss": 0.9, "accuracy": 1.0, "learning_rate": 3.227081868615847e-05, "epoch": 0.40606767794632437, "percentage": 40.61, "elapsed_time": "2:25:12", "remaining_time": "3:32:23", "throughput": 783.65, "total_tokens": 6827504} {"current_steps": 5230, "total_steps": 12855, "loss": 0.9842, "accuracy": 1.0, "learning_rate": 3.221234129709645e-05, "epoch": 0.4068455853753403, "percentage": 40.68, "elapsed_time": "2:25:25", "remaining_time": "3:32:01", "throughput": 783.73, "total_tokens": 6838800} {"current_steps": 5240, "total_steps": 12855, "loss": 1.1193, "accuracy": 0.8999999761581421, "learning_rate": 3.215382083240451e-05, "epoch": 0.4076234928043563, "percentage": 40.76, "elapsed_time": "2:25:40", "remaining_time": "3:31:42", "throughput": 783.71, "total_tokens": 6850048} {"current_steps": 5250, "total_steps": 12855, "loss": 0.702, "accuracy": 0.8999999761581421, "learning_rate": 3.209525764159548e-05, "epoch": 0.40840140023337224, "percentage": 40.84, "elapsed_time": "2:25:55", "remaining_time": "3:31:22", "throughput": 783.92, "total_tokens": 6863520} {"current_steps": 5260, "total_steps": 12855, "loss": 0.788, "accuracy": 1.0, "learning_rate": 3.203665207443738e-05, "epoch": 0.4091793076623882, "percentage": 40.92, "elapsed_time": "2:26:07", "remaining_time": "3:30:59", "throughput": 784.03, "total_tokens": 6873776} {"current_steps": 5270, "total_steps": 12855, "loss": 0.9847, "accuracy": 1.0, "learning_rate": 3.197800448095133e-05, "epoch": 0.40995721509140415, "percentage": 41.0, "elapsed_time": "2:26:27", "remaining_time": "3:30:47", "throughput": 784.11, "total_tokens": 6890400} {"current_steps": 5280, "total_steps": 12855, "loss": 1.4162, "accuracy": 0.699999988079071, "learning_rate": 3.191931521140943e-05, "epoch": 0.41073512252042005, "percentage": 41.07, "elapsed_time": "2:26:48", "remaining_time": "3:30:37", "throughput": 784.09, "total_tokens": 6906960} {"current_steps": 5290, "total_steps": 12855, "loss": 0.9869, "accuracy": 0.8999999761581421, "learning_rate": 3.186058461633271e-05, "epoch": 0.411513029949436, "percentage": 41.15, "elapsed_time": "2:27:00", "remaining_time": "3:30:13", "throughput": 784.24, "total_tokens": 6917440} {"current_steps": 5300, "total_steps": 12855, "loss": 0.8738, "accuracy": 0.800000011920929, "learning_rate": 3.180181304648902e-05, "epoch": 0.41229093737845196, "percentage": 41.23, "elapsed_time": "2:27:09", "remaining_time": "3:29:46", "throughput": 784.36, "total_tokens": 6925824} {"current_steps": 5310, "total_steps": 12855, "loss": 0.9261, "accuracy": 0.8999999761581421, "learning_rate": 3.17430008528909e-05, "epoch": 0.4130688448074679, "percentage": 41.31, "elapsed_time": "2:27:22", "remaining_time": "3:29:24", "throughput": 784.52, "total_tokens": 6937024} {"current_steps": 5320, "total_steps": 12855, "loss": 0.962, "accuracy": 0.699999988079071, "learning_rate": 3.168414838679356e-05, "epoch": 0.4138467522364839, "percentage": 41.38, "elapsed_time": "2:27:36", "remaining_time": "3:29:03", "throughput": 784.68, "total_tokens": 6949456} {"current_steps": 5330, "total_steps": 12855, "loss": 1.2351, "accuracy": 0.699999988079071, "learning_rate": 3.1625255999692707e-05, "epoch": 0.41462465966549983, "percentage": 41.46, "elapsed_time": "2:27:56", "remaining_time": "3:28:52", "throughput": 784.68, "total_tokens": 6965536} {"current_steps": 5340, "total_steps": 12855, "loss": 1.2494, "accuracy": 0.800000011920929, "learning_rate": 3.156632404332247e-05, "epoch": 0.41540256709451573, "percentage": 41.54, "elapsed_time": "2:28:17", "remaining_time": "3:28:41", "throughput": 784.71, "total_tokens": 6982160} {"current_steps": 5350, "total_steps": 12855, "loss": 0.8583, "accuracy": 1.0, "learning_rate": 3.1507352869653326e-05, "epoch": 0.4161804745235317, "percentage": 41.62, "elapsed_time": "2:28:43", "remaining_time": "3:28:38", "throughput": 784.45, "total_tokens": 7000208} {"current_steps": 5360, "total_steps": 12855, "loss": 0.6832, "accuracy": 0.8999999761581421, "learning_rate": 3.144834283088997e-05, "epoch": 0.41695838195254764, "percentage": 41.7, "elapsed_time": "2:29:03", "remaining_time": "3:28:25", "throughput": 784.4, "total_tokens": 7015120} {"current_steps": 5370, "total_steps": 12855, "loss": 0.9423, "accuracy": 0.8999999761581421, "learning_rate": 3.1389294279469215e-05, "epoch": 0.4177362893815636, "percentage": 41.77, "elapsed_time": "2:29:21", "remaining_time": "3:28:10", "throughput": 784.36, "total_tokens": 7028880} {"current_steps": 5380, "total_steps": 12855, "loss": 0.984, "accuracy": 0.699999988079071, "learning_rate": 3.133020756805789e-05, "epoch": 0.41851419681057955, "percentage": 41.85, "elapsed_time": "2:29:29", "remaining_time": "3:27:42", "throughput": 784.7, "total_tokens": 7038720} {"current_steps": 5390, "total_steps": 12855, "loss": 0.9056, "accuracy": 0.8999999761581421, "learning_rate": 3.1271083049550736e-05, "epoch": 0.4192921042395955, "percentage": 41.93, "elapsed_time": "2:29:45", "remaining_time": "3:27:24", "throughput": 784.91, "total_tokens": 7052992} {"current_steps": 5400, "total_steps": 12855, "loss": 0.837, "accuracy": 0.8999999761581421, "learning_rate": 3.12119210770683e-05, "epoch": 0.4200700116686114, "percentage": 42.01, "elapsed_time": "2:30:10", "remaining_time": "3:27:19", "throughput": 784.73, "total_tokens": 7071088} {"current_steps": 5410, "total_steps": 12855, "loss": 1.0268, "accuracy": 0.5, "learning_rate": 3.1152722003954815e-05, "epoch": 0.42084791909762737, "percentage": 42.08, "elapsed_time": "2:30:20", "remaining_time": "3:26:54", "throughput": 785.0, "total_tokens": 7081392} {"current_steps": 5420, "total_steps": 12855, "loss": 0.9555, "accuracy": 1.0, "learning_rate": 3.10934861837761e-05, "epoch": 0.4216258265266433, "percentage": 42.16, "elapsed_time": "2:30:32", "remaining_time": "3:26:30", "throughput": 785.32, "total_tokens": 7093248} {"current_steps": 5430, "total_steps": 12855, "loss": 1.0209, "accuracy": 0.8999999761581421, "learning_rate": 3.103421397031745e-05, "epoch": 0.4224037339556593, "percentage": 42.24, "elapsed_time": "2:31:12", "remaining_time": "3:26:45", "throughput": 783.95, "total_tokens": 7112240} {"current_steps": 5440, "total_steps": 12855, "loss": 0.7893, "accuracy": 1.0, "learning_rate": 3.097490571758151e-05, "epoch": 0.42318164138467523, "percentage": 42.32, "elapsed_time": "2:31:38", "remaining_time": "3:26:41", "throughput": 783.83, "total_tokens": 7131280} {"current_steps": 5450, "total_steps": 12855, "loss": 0.7227, "accuracy": 1.0, "learning_rate": 3.091556177978619e-05, "epoch": 0.4239595488136912, "percentage": 42.4, "elapsed_time": "2:31:58", "remaining_time": "3:26:28", "throughput": 783.71, "total_tokens": 7145920} {"current_steps": 5460, "total_steps": 12855, "loss": 0.9378, "accuracy": 1.0, "learning_rate": 3.08561825113625e-05, "epoch": 0.42473745624270715, "percentage": 42.47, "elapsed_time": "2:32:19", "remaining_time": "3:26:18", "throughput": 783.54, "total_tokens": 7161216} {"current_steps": 5470, "total_steps": 12855, "loss": 0.8656, "accuracy": 1.0, "learning_rate": 3.079676826695248e-05, "epoch": 0.42551536367172305, "percentage": 42.55, "elapsed_time": "2:32:32", "remaining_time": "3:25:56", "throughput": 783.7, "total_tokens": 7172848} {"current_steps": 5480, "total_steps": 12855, "loss": 0.9704, "accuracy": 0.699999988079071, "learning_rate": 3.0737319401407037e-05, "epoch": 0.426293271100739, "percentage": 42.63, "elapsed_time": "2:32:52", "remaining_time": "3:25:44", "throughput": 783.61, "total_tokens": 7187648} {"current_steps": 5490, "total_steps": 12855, "loss": 1.1696, "accuracy": 1.0, "learning_rate": 3.0677836269783895e-05, "epoch": 0.42707117852975496, "percentage": 42.71, "elapsed_time": "2:33:07", "remaining_time": "3:25:25", "throughput": 783.73, "total_tokens": 7200368} {"current_steps": 5500, "total_steps": 12855, "loss": 0.9635, "accuracy": 0.8999999761581421, "learning_rate": 3.061831922734541e-05, "epoch": 0.4278490859587709, "percentage": 42.78, "elapsed_time": "2:33:19", "remaining_time": "3:25:02", "throughput": 783.87, "total_tokens": 7211472} {"current_steps": 5510, "total_steps": 12855, "loss": 0.8666, "accuracy": 1.0, "learning_rate": 3.055876862955647e-05, "epoch": 0.42862699338778687, "percentage": 42.86, "elapsed_time": "2:33:30", "remaining_time": "3:24:38", "throughput": 784.16, "total_tokens": 7222832} {"current_steps": 5520, "total_steps": 12855, "loss": 0.9139, "accuracy": 1.0, "learning_rate": 3.0499184832082362e-05, "epoch": 0.4294049008168028, "percentage": 42.94, "elapsed_time": "2:33:41", "remaining_time": "3:24:13", "throughput": 784.35, "total_tokens": 7232992} {"current_steps": 5530, "total_steps": 12855, "loss": 0.8556, "accuracy": 0.800000011920929, "learning_rate": 3.0439568190786682e-05, "epoch": 0.4301828082458187, "percentage": 43.02, "elapsed_time": "2:33:48", "remaining_time": "3:23:43", "throughput": 784.73, "total_tokens": 7241760} {"current_steps": 5540, "total_steps": 12855, "loss": 0.8981, "accuracy": 0.8999999761581421, "learning_rate": 3.0379919061729168e-05, "epoch": 0.4309607156748347, "percentage": 43.1, "elapsed_time": "2:34:02", "remaining_time": "3:23:23", "throughput": 785.0, "total_tokens": 7254960} {"current_steps": 5550, "total_steps": 12855, "loss": 0.7485, "accuracy": 1.0, "learning_rate": 3.032023780116358e-05, "epoch": 0.43173862310385064, "percentage": 43.17, "elapsed_time": "2:34:27", "remaining_time": "3:23:17", "throughput": 784.81, "total_tokens": 7273088} {"current_steps": 5560, "total_steps": 12855, "loss": 0.8194, "accuracy": 1.0, "learning_rate": 3.026052476553561e-05, "epoch": 0.4325165305328666, "percentage": 43.25, "elapsed_time": "2:34:39", "remaining_time": "3:22:55", "throughput": 785.15, "total_tokens": 7286160} {"current_steps": 5570, "total_steps": 12855, "loss": 1.1695, "accuracy": 1.0, "learning_rate": 3.0200780311480716e-05, "epoch": 0.43329443796188255, "percentage": 43.33, "elapsed_time": "2:34:54", "remaining_time": "3:22:36", "throughput": 785.15, "total_tokens": 7297920} {"current_steps": 5580, "total_steps": 12855, "loss": 1.1741, "accuracy": 1.0, "learning_rate": 3.0141004795821992e-05, "epoch": 0.4340723453908985, "percentage": 43.41, "elapsed_time": "2:35:13", "remaining_time": "3:22:23", "throughput": 785.01, "total_tokens": 7311472} {"current_steps": 5590, "total_steps": 12855, "loss": 0.9199, "accuracy": 0.8999999761581421, "learning_rate": 3.008119857556807e-05, "epoch": 0.4348502528199144, "percentage": 43.49, "elapsed_time": "2:35:26", "remaining_time": "3:22:01", "throughput": 785.05, "total_tokens": 7322080} {"current_steps": 5600, "total_steps": 12855, "loss": 1.1625, "accuracy": 1.0, "learning_rate": 3.002136200791093e-05, "epoch": 0.43562816024893036, "percentage": 43.56, "elapsed_time": "2:35:48", "remaining_time": "3:21:51", "throughput": 784.83, "total_tokens": 7337232} {"current_steps": 5610, "total_steps": 12855, "loss": 0.9769, "accuracy": 0.8999999761581421, "learning_rate": 2.996149545022383e-05, "epoch": 0.4364060676779463, "percentage": 43.64, "elapsed_time": "2:36:00", "remaining_time": "3:21:28", "throughput": 784.93, "total_tokens": 7347408} {"current_steps": 5620, "total_steps": 12855, "loss": 1.0359, "accuracy": 1.0, "learning_rate": 2.990159926005913e-05, "epoch": 0.4371839751069623, "percentage": 43.72, "elapsed_time": "2:36:20", "remaining_time": "3:21:15", "throughput": 784.89, "total_tokens": 7362448} {"current_steps": 5630, "total_steps": 12855, "loss": 1.0562, "accuracy": 0.8999999761581421, "learning_rate": 2.984167379514618e-05, "epoch": 0.43796188253597823, "percentage": 43.8, "elapsed_time": "2:36:38", "remaining_time": "3:21:01", "throughput": 784.9, "total_tokens": 7377168} {"current_steps": 5640, "total_steps": 12855, "loss": 0.9189, "accuracy": 0.800000011920929, "learning_rate": 2.978171941338917e-05, "epoch": 0.4387397899649942, "percentage": 43.87, "elapsed_time": "2:36:51", "remaining_time": "3:20:40", "throughput": 785.3, "total_tokens": 7391184} {"current_steps": 5650, "total_steps": 12855, "loss": 1.8715, "accuracy": 0.8999999761581421, "learning_rate": 2.972173647286499e-05, "epoch": 0.4395176973940101, "percentage": 43.95, "elapsed_time": "2:37:08", "remaining_time": "3:20:24", "throughput": 785.38, "total_tokens": 7405376} {"current_steps": 5660, "total_steps": 12855, "loss": 1.9488, "accuracy": 0.699999988079071, "learning_rate": 2.96617253318211e-05, "epoch": 0.44029560482302604, "percentage": 44.03, "elapsed_time": "2:37:26", "remaining_time": "3:20:08", "throughput": 785.41, "total_tokens": 7419312} {"current_steps": 5670, "total_steps": 12855, "loss": 1.1235, "accuracy": 1.0, "learning_rate": 2.960168634867338e-05, "epoch": 0.441073512252042, "percentage": 44.11, "elapsed_time": "2:37:42", "remaining_time": "3:19:51", "throughput": 785.47, "total_tokens": 7432704} {"current_steps": 5680, "total_steps": 12855, "loss": 0.8774, "accuracy": 0.8999999761581421, "learning_rate": 2.9541619882004007e-05, "epoch": 0.44185141968105796, "percentage": 44.19, "elapsed_time": "2:37:59", "remaining_time": "3:19:34", "throughput": 785.61, "total_tokens": 7447376} {"current_steps": 5690, "total_steps": 12855, "loss": 1.026, "accuracy": 0.8999999761581421, "learning_rate": 2.9481526290559298e-05, "epoch": 0.4426293271100739, "percentage": 44.26, "elapsed_time": "2:38:09", "remaining_time": "3:19:09", "throughput": 785.91, "total_tokens": 7457856} {"current_steps": 5700, "total_steps": 12855, "loss": 0.9163, "accuracy": 0.8999999761581421, "learning_rate": 2.9421405933247582e-05, "epoch": 0.44340723453908987, "percentage": 44.34, "elapsed_time": "2:38:21", "remaining_time": "3:18:47", "throughput": 786.11, "total_tokens": 7469360} {"current_steps": 5710, "total_steps": 12855, "loss": 1.139, "accuracy": 1.0, "learning_rate": 2.936125916913704e-05, "epoch": 0.44418514196810577, "percentage": 44.42, "elapsed_time": "2:38:31", "remaining_time": "3:18:21", "throughput": 786.32, "total_tokens": 7478880} {"current_steps": 5720, "total_steps": 12855, "loss": 1.0214, "accuracy": 0.8999999761581421, "learning_rate": 2.9301086357453557e-05, "epoch": 0.4449630493971217, "percentage": 44.5, "elapsed_time": "2:38:52", "remaining_time": "3:18:10", "throughput": 786.34, "total_tokens": 7495696} {"current_steps": 5730, "total_steps": 12855, "loss": 0.7909, "accuracy": 1.0, "learning_rate": 2.9240887857578597e-05, "epoch": 0.4457409568261377, "percentage": 44.57, "elapsed_time": "2:39:05", "remaining_time": "3:17:48", "throughput": 786.48, "total_tokens": 7507056} {"current_steps": 5740, "total_steps": 12855, "loss": 0.7787, "accuracy": 0.8999999761581421, "learning_rate": 2.918066402904705e-05, "epoch": 0.44651886425515364, "percentage": 44.65, "elapsed_time": "2:39:14", "remaining_time": "3:17:23", "throughput": 786.75, "total_tokens": 7517136} {"current_steps": 5750, "total_steps": 12855, "loss": 0.9802, "accuracy": 1.0, "learning_rate": 2.9120415231545066e-05, "epoch": 0.4472967716841696, "percentage": 44.73, "elapsed_time": "2:39:30", "remaining_time": "3:17:05", "throughput": 786.85, "total_tokens": 7530208} {"current_steps": 5760, "total_steps": 12855, "loss": 0.9545, "accuracy": 1.0, "learning_rate": 2.906014182490795e-05, "epoch": 0.44807467911318555, "percentage": 44.81, "elapsed_time": "2:39:46", "remaining_time": "3:16:47", "throughput": 786.99, "total_tokens": 7544272} {"current_steps": 5770, "total_steps": 12855, "loss": 0.8435, "accuracy": 1.0, "learning_rate": 2.8999844169117958e-05, "epoch": 0.4488525865422015, "percentage": 44.89, "elapsed_time": "2:40:05", "remaining_time": "3:16:34", "throughput": 786.92, "total_tokens": 7558480} {"current_steps": 5780, "total_steps": 12855, "loss": 1.0583, "accuracy": 0.800000011920929, "learning_rate": 2.893952262430219e-05, "epoch": 0.4496304939712174, "percentage": 44.96, "elapsed_time": "2:40:21", "remaining_time": "3:16:16", "throughput": 787.01, "total_tokens": 7572112} {"current_steps": 5790, "total_steps": 12855, "loss": 0.847, "accuracy": 0.8999999761581421, "learning_rate": 2.8879177550730407e-05, "epoch": 0.45040840140023336, "percentage": 45.04, "elapsed_time": "2:40:37", "remaining_time": "3:15:59", "throughput": 787.1, "total_tokens": 7585360} {"current_steps": 5800, "total_steps": 12855, "loss": 1.0204, "accuracy": 0.8999999761581421, "learning_rate": 2.8818809308812906e-05, "epoch": 0.4511863088292493, "percentage": 45.12, "elapsed_time": "2:40:52", "remaining_time": "3:15:41", "throughput": 787.31, "total_tokens": 7599648} {"current_steps": 5810, "total_steps": 12855, "loss": 0.7841, "accuracy": 1.0, "learning_rate": 2.875841825909835e-05, "epoch": 0.45196421625826527, "percentage": 45.2, "elapsed_time": "2:41:00", "remaining_time": "3:15:14", "throughput": 787.46, "total_tokens": 7607328} {"current_steps": 5820, "total_steps": 12855, "loss": 1.161, "accuracy": 1.0, "learning_rate": 2.8698004762271634e-05, "epoch": 0.45274212368728123, "percentage": 45.27, "elapsed_time": "2:41:14", "remaining_time": "3:14:54", "throughput": 787.6, "total_tokens": 7619840} {"current_steps": 5830, "total_steps": 12855, "loss": 0.9073, "accuracy": 1.0, "learning_rate": 2.8637569179151714e-05, "epoch": 0.4535200311162972, "percentage": 45.35, "elapsed_time": "2:41:29", "remaining_time": "3:14:35", "throughput": 787.77, "total_tokens": 7632912} {"current_steps": 5840, "total_steps": 12855, "loss": 0.9031, "accuracy": 1.0, "learning_rate": 2.8577111870689454e-05, "epoch": 0.4542979385453131, "percentage": 45.43, "elapsed_time": "2:41:43", "remaining_time": "3:14:16", "throughput": 787.84, "total_tokens": 7645040} {"current_steps": 5850, "total_steps": 12855, "loss": 1.116, "accuracy": 1.0, "learning_rate": 2.8516633197965458e-05, "epoch": 0.45507584597432904, "percentage": 45.51, "elapsed_time": "2:42:01", "remaining_time": "3:14:00", "throughput": 787.96, "total_tokens": 7659872} {"current_steps": 5860, "total_steps": 12855, "loss": 0.904, "accuracy": 1.0, "learning_rate": 2.845613352218795e-05, "epoch": 0.455853753403345, "percentage": 45.59, "elapsed_time": "2:42:20", "remaining_time": "3:13:47", "throughput": 787.93, "total_tokens": 7675120} {"current_steps": 5870, "total_steps": 12855, "loss": 0.8221, "accuracy": 0.8999999761581421, "learning_rate": 2.839561320469058e-05, "epoch": 0.45663166083236095, "percentage": 45.66, "elapsed_time": "2:42:41", "remaining_time": "3:13:35", "throughput": 787.85, "total_tokens": 7690256} {"current_steps": 5880, "total_steps": 12855, "loss": 1.1136, "accuracy": 1.0, "learning_rate": 2.8335072606930287e-05, "epoch": 0.4574095682613769, "percentage": 45.74, "elapsed_time": "2:43:00", "remaining_time": "3:13:21", "throughput": 787.57, "total_tokens": 7702640} {"current_steps": 5890, "total_steps": 12855, "loss": 0.996, "accuracy": 0.800000011920929, "learning_rate": 2.827451209048514e-05, "epoch": 0.45818747569039286, "percentage": 45.82, "elapsed_time": "2:43:10", "remaining_time": "3:12:57", "throughput": 787.83, "total_tokens": 7713392} {"current_steps": 5900, "total_steps": 12855, "loss": 0.843, "accuracy": 1.0, "learning_rate": 2.8213932017052164e-05, "epoch": 0.45896538311940877, "percentage": 45.9, "elapsed_time": "2:43:21", "remaining_time": "3:12:34", "throughput": 787.99, "total_tokens": 7723536} {"current_steps": 5910, "total_steps": 12855, "loss": 0.8648, "accuracy": 0.8999999761581421, "learning_rate": 2.8153332748445178e-05, "epoch": 0.4597432905484247, "percentage": 45.97, "elapsed_time": "2:43:31", "remaining_time": "3:12:09", "throughput": 788.22, "total_tokens": 7733392} {"current_steps": 5920, "total_steps": 12855, "loss": 0.9214, "accuracy": 0.8999999761581421, "learning_rate": 2.8092714646592654e-05, "epoch": 0.4605211979774407, "percentage": 46.05, "elapsed_time": "2:43:45", "remaining_time": "3:11:50", "throughput": 788.32, "total_tokens": 7745856} {"current_steps": 5930, "total_steps": 12855, "loss": 0.6876, "accuracy": 0.8999999761581421, "learning_rate": 2.803207807353556e-05, "epoch": 0.46129910540645663, "percentage": 46.13, "elapsed_time": "2:44:01", "remaining_time": "3:11:32", "throughput": 788.48, "total_tokens": 7759568} {"current_steps": 5940, "total_steps": 12855, "loss": 1.0659, "accuracy": 0.8999999761581421, "learning_rate": 2.7971423391425154e-05, "epoch": 0.4620770128354726, "percentage": 46.21, "elapsed_time": "2:44:18", "remaining_time": "3:11:16", "throughput": 788.64, "total_tokens": 7774960} {"current_steps": 5950, "total_steps": 12855, "loss": 0.6976, "accuracy": 0.8999999761581421, "learning_rate": 2.7910750962520872e-05, "epoch": 0.46285492026448855, "percentage": 46.29, "elapsed_time": "2:44:33", "remaining_time": "3:10:58", "throughput": 788.64, "total_tokens": 7786784} {"current_steps": 5960, "total_steps": 12855, "loss": 1.0446, "accuracy": 0.8999999761581421, "learning_rate": 2.7850061149188146e-05, "epoch": 0.46363282769350445, "percentage": 46.36, "elapsed_time": "2:44:48", "remaining_time": "3:10:39", "throughput": 788.77, "total_tokens": 7799360} {"current_steps": 5970, "total_steps": 12855, "loss": 0.8972, "accuracy": 0.8999999761581421, "learning_rate": 2.7789354313896203e-05, "epoch": 0.4644107351225204, "percentage": 46.44, "elapsed_time": "2:45:10", "remaining_time": "3:10:29", "throughput": 788.62, "total_tokens": 7815408} {"current_steps": 5980, "total_steps": 12855, "loss": 1.0319, "accuracy": 0.800000011920929, "learning_rate": 2.7728630819215978e-05, "epoch": 0.46518864255153636, "percentage": 46.52, "elapsed_time": "2:45:23", "remaining_time": "3:10:08", "throughput": 788.71, "total_tokens": 7826352} {"current_steps": 5990, "total_steps": 12855, "loss": 0.7815, "accuracy": 0.8999999761581421, "learning_rate": 2.7667891027817865e-05, "epoch": 0.4659665499805523, "percentage": 46.6, "elapsed_time": "2:45:30", "remaining_time": "3:09:41", "throughput": 788.84, "total_tokens": 7833904} {"current_steps": 6000, "total_steps": 12855, "loss": 1.6485, "accuracy": 0.800000011920929, "learning_rate": 2.7607135302469615e-05, "epoch": 0.46674445740956827, "percentage": 46.67, "elapsed_time": "2:45:55", "remaining_time": "3:09:34", "throughput": 788.55, "total_tokens": 7850688} {"current_steps": 6010, "total_steps": 12855, "loss": 0.8854, "accuracy": 0.8999999761581421, "learning_rate": 2.7546364006034137e-05, "epoch": 0.4675223648385842, "percentage": 46.75, "elapsed_time": "2:46:16", "remaining_time": "3:09:22", "throughput": 788.12, "total_tokens": 7862704} {"current_steps": 6020, "total_steps": 12855, "loss": 0.849, "accuracy": 0.8999999761581421, "learning_rate": 2.7485577501467337e-05, "epoch": 0.4683002722676002, "percentage": 46.83, "elapsed_time": "2:46:32", "remaining_time": "3:09:05", "throughput": 788.2, "total_tokens": 7876240} {"current_steps": 6030, "total_steps": 12855, "loss": 1.0526, "accuracy": 1.0, "learning_rate": 2.742477615181596e-05, "epoch": 0.4690781796966161, "percentage": 46.91, "elapsed_time": "2:46:42", "remaining_time": "3:08:40", "throughput": 788.39, "total_tokens": 7885536} {"current_steps": 6040, "total_steps": 12855, "loss": 0.6009, "accuracy": 1.0, "learning_rate": 2.7363960320215393e-05, "epoch": 0.46985608712563204, "percentage": 46.99, "elapsed_time": "2:46:59", "remaining_time": "3:08:25", "throughput": 788.25, "total_tokens": 7898160} {"current_steps": 6050, "total_steps": 12855, "loss": 0.9212, "accuracy": 0.8999999761581421, "learning_rate": 2.730313036988753e-05, "epoch": 0.470633994554648, "percentage": 47.06, "elapsed_time": "2:47:15", "remaining_time": "3:08:07", "throughput": 788.29, "total_tokens": 7910608} {"current_steps": 6060, "total_steps": 12855, "loss": 0.7449, "accuracy": 0.8999999761581421, "learning_rate": 2.7242286664138595e-05, "epoch": 0.47141190198366395, "percentage": 47.14, "elapsed_time": "2:47:28", "remaining_time": "3:07:47", "throughput": 788.55, "total_tokens": 7923776} {"current_steps": 6070, "total_steps": 12855, "loss": 0.8009, "accuracy": 1.0, "learning_rate": 2.7181429566356952e-05, "epoch": 0.4721898094126799, "percentage": 47.22, "elapsed_time": "2:47:40", "remaining_time": "3:07:25", "throughput": 788.71, "total_tokens": 7934848} {"current_steps": 6080, "total_steps": 12855, "loss": 0.9441, "accuracy": 1.0, "learning_rate": 2.712055944001095e-05, "epoch": 0.47296771684169586, "percentage": 47.3, "elapsed_time": "2:47:52", "remaining_time": "3:07:03", "throughput": 788.95, "total_tokens": 7946752} {"current_steps": 6090, "total_steps": 12855, "loss": 0.9719, "accuracy": 0.8999999761581421, "learning_rate": 2.705967664864678e-05, "epoch": 0.47374562427071176, "percentage": 47.37, "elapsed_time": "2:48:06", "remaining_time": "3:06:44", "throughput": 789.07, "total_tokens": 7959040} {"current_steps": 6100, "total_steps": 12855, "loss": 0.8161, "accuracy": 1.0, "learning_rate": 2.6998781555886227e-05, "epoch": 0.4745235316997277, "percentage": 47.45, "elapsed_time": "2:48:19", "remaining_time": "3:06:24", "throughput": 789.35, "total_tokens": 7972240} {"current_steps": 6110, "total_steps": 12855, "loss": 1.2286, "accuracy": 0.800000011920929, "learning_rate": 2.6937874525424577e-05, "epoch": 0.4753014391287437, "percentage": 47.53, "elapsed_time": "2:48:40", "remaining_time": "3:06:12", "throughput": 789.22, "total_tokens": 7987488} {"current_steps": 6120, "total_steps": 12855, "loss": 0.7285, "accuracy": 1.0, "learning_rate": 2.6876955921028408e-05, "epoch": 0.47607934655775963, "percentage": 47.61, "elapsed_time": "2:48:52", "remaining_time": "3:05:50", "throughput": 789.45, "total_tokens": 7998720} {"current_steps": 6130, "total_steps": 12855, "loss": 0.878, "accuracy": 1.0, "learning_rate": 2.6816026106533428e-05, "epoch": 0.4768572539867756, "percentage": 47.69, "elapsed_time": "2:49:15", "remaining_time": "3:05:41", "throughput": 789.39, "total_tokens": 8016608} {"current_steps": 6140, "total_steps": 12855, "loss": 0.8433, "accuracy": 0.800000011920929, "learning_rate": 2.6755085445842276e-05, "epoch": 0.47763516141579154, "percentage": 47.76, "elapsed_time": "2:49:30", "remaining_time": "3:05:23", "throughput": 789.52, "total_tokens": 8029872} {"current_steps": 6150, "total_steps": 12855, "loss": 0.9548, "accuracy": 1.0, "learning_rate": 2.6694134302922396e-05, "epoch": 0.47841306884480744, "percentage": 47.84, "elapsed_time": "2:49:48", "remaining_time": "3:05:08", "throughput": 789.61, "total_tokens": 8045200} {"current_steps": 6160, "total_steps": 12855, "loss": 0.8676, "accuracy": 1.0, "learning_rate": 2.6633173041803828e-05, "epoch": 0.4791909762738234, "percentage": 47.92, "elapsed_time": "2:50:06", "remaining_time": "3:04:53", "throughput": 789.77, "total_tokens": 8060896} {"current_steps": 6170, "total_steps": 12855, "loss": 0.7677, "accuracy": 1.0, "learning_rate": 2.6572202026577036e-05, "epoch": 0.47996888370283936, "percentage": 48.0, "elapsed_time": "2:50:23", "remaining_time": "3:04:36", "throughput": 789.8, "total_tokens": 8074224} {"current_steps": 6180, "total_steps": 12855, "loss": 0.996, "accuracy": 0.800000011920929, "learning_rate": 2.651122162139074e-05, "epoch": 0.4807467911318553, "percentage": 48.07, "elapsed_time": "2:50:40", "remaining_time": "3:04:21", "throughput": 789.8, "total_tokens": 8088144} {"current_steps": 6190, "total_steps": 12855, "loss": 0.8474, "accuracy": 1.0, "learning_rate": 2.6450232190449758e-05, "epoch": 0.48152469856087127, "percentage": 48.15, "elapsed_time": "2:50:59", "remaining_time": "3:04:06", "throughput": 789.71, "total_tokens": 8101824} {"current_steps": 6200, "total_steps": 12855, "loss": 1.0605, "accuracy": 0.8999999761581421, "learning_rate": 2.6389234098012792e-05, "epoch": 0.4823026059898872, "percentage": 48.23, "elapsed_time": "2:51:21", "remaining_time": "3:03:56", "throughput": 789.68, "total_tokens": 8119472} {"current_steps": 6210, "total_steps": 12855, "loss": 0.7782, "accuracy": 0.8999999761581421, "learning_rate": 2.6328227708390297e-05, "epoch": 0.4830805134189031, "percentage": 48.31, "elapsed_time": "2:51:38", "remaining_time": "3:03:39", "throughput": 789.75, "total_tokens": 8133248} {"current_steps": 6220, "total_steps": 12855, "loss": 1.2817, "accuracy": 1.0, "learning_rate": 2.6267213385942262e-05, "epoch": 0.4838584208479191, "percentage": 48.39, "elapsed_time": "2:51:58", "remaining_time": "3:03:27", "throughput": 789.75, "total_tokens": 8149296} {"current_steps": 6230, "total_steps": 12855, "loss": 0.9965, "accuracy": 1.0, "learning_rate": 2.6206191495076065e-05, "epoch": 0.48463632827693504, "percentage": 48.46, "elapsed_time": "2:52:20", "remaining_time": "3:03:16", "throughput": 789.6, "total_tokens": 8165152} {"current_steps": 6240, "total_steps": 12855, "loss": 0.9536, "accuracy": 0.699999988079071, "learning_rate": 2.614516240024429e-05, "epoch": 0.485414235705951, "percentage": 48.54, "elapsed_time": "2:52:34", "remaining_time": "3:02:56", "throughput": 789.82, "total_tokens": 8177776} {"current_steps": 6250, "total_steps": 12855, "loss": 0.9641, "accuracy": 0.8999999761581421, "learning_rate": 2.608412646594254e-05, "epoch": 0.48619214313496695, "percentage": 48.62, "elapsed_time": "2:52:50", "remaining_time": "3:02:39", "throughput": 789.95, "total_tokens": 8192080} {"current_steps": 6260, "total_steps": 12855, "loss": 0.7637, "accuracy": 0.8999999761581421, "learning_rate": 2.6023084056707258e-05, "epoch": 0.4869700505639829, "percentage": 48.7, "elapsed_time": "2:53:06", "remaining_time": "3:02:22", "throughput": 789.94, "total_tokens": 8204656} {"current_steps": 6270, "total_steps": 12855, "loss": 0.9785, "accuracy": 0.8999999761581421, "learning_rate": 2.596203553711359e-05, "epoch": 0.48774795799299886, "percentage": 48.77, "elapsed_time": "2:53:21", "remaining_time": "3:02:04", "throughput": 789.97, "total_tokens": 8216896} {"current_steps": 6280, "total_steps": 12855, "loss": 0.8551, "accuracy": 0.8999999761581421, "learning_rate": 2.5900981271773133e-05, "epoch": 0.48852586542201476, "percentage": 48.85, "elapsed_time": "2:53:43", "remaining_time": "3:01:52", "throughput": 789.78, "total_tokens": 8232096} {"current_steps": 6290, "total_steps": 12855, "loss": 2.2166, "accuracy": 0.800000011920929, "learning_rate": 2.5839921625331842e-05, "epoch": 0.4893037728510307, "percentage": 48.93, "elapsed_time": "2:53:51", "remaining_time": "3:01:27", "throughput": 790.01, "total_tokens": 8241072} {"current_steps": 6300, "total_steps": 12855, "loss": 0.9603, "accuracy": 0.8999999761581421, "learning_rate": 2.5778856962467777e-05, "epoch": 0.49008168028004667, "percentage": 49.01, "elapsed_time": "2:53:59", "remaining_time": "3:01:02", "throughput": 790.18, "total_tokens": 8249264} {"current_steps": 6310, "total_steps": 12855, "loss": 0.9124, "accuracy": 0.8999999761581421, "learning_rate": 2.571778764788898e-05, "epoch": 0.49085958770906263, "percentage": 49.09, "elapsed_time": "2:54:16", "remaining_time": "3:00:46", "throughput": 790.15, "total_tokens": 8262368} {"current_steps": 6320, "total_steps": 12855, "loss": 0.9271, "accuracy": 1.0, "learning_rate": 2.5656714046331265e-05, "epoch": 0.4916374951380786, "percentage": 49.16, "elapsed_time": "2:54:32", "remaining_time": "3:00:28", "throughput": 790.05, "total_tokens": 8273760} {"current_steps": 6330, "total_steps": 12855, "loss": 0.8607, "accuracy": 0.8999999761581421, "learning_rate": 2.559563652255605e-05, "epoch": 0.49241540256709454, "percentage": 49.24, "elapsed_time": "2:54:45", "remaining_time": "3:00:08", "throughput": 790.21, "total_tokens": 8285680} {"current_steps": 6340, "total_steps": 12855, "loss": 0.9345, "accuracy": 0.8999999761581421, "learning_rate": 2.553455544134819e-05, "epoch": 0.49319330999611044, "percentage": 49.32, "elapsed_time": "2:54:58", "remaining_time": "2:59:48", "throughput": 790.33, "total_tokens": 8297488} {"current_steps": 6350, "total_steps": 12855, "loss": 0.9277, "accuracy": 1.0, "learning_rate": 2.547347116751377e-05, "epoch": 0.4939712174251264, "percentage": 49.4, "elapsed_time": "2:55:11", "remaining_time": "2:59:28", "throughput": 790.41, "total_tokens": 8308768} {"current_steps": 6360, "total_steps": 12855, "loss": 0.9766, "accuracy": 0.8999999761581421, "learning_rate": 2.5412384065877954e-05, "epoch": 0.49474912485414235, "percentage": 49.47, "elapsed_time": "2:55:25", "remaining_time": "2:59:08", "throughput": 790.58, "total_tokens": 8321168} {"current_steps": 6370, "total_steps": 12855, "loss": 1.0673, "accuracy": 0.8999999761581421, "learning_rate": 2.5351294501282785e-05, "epoch": 0.4955270322831583, "percentage": 49.55, "elapsed_time": "2:55:45", "remaining_time": "2:58:55", "throughput": 790.63, "total_tokens": 8337456} {"current_steps": 6380, "total_steps": 12855, "loss": 1.1561, "accuracy": 0.800000011920929, "learning_rate": 2.5290202838585036e-05, "epoch": 0.49630493971217426, "percentage": 49.63, "elapsed_time": "2:55:55", "remaining_time": "2:58:32", "throughput": 790.76, "total_tokens": 8347088} {"current_steps": 6390, "total_steps": 12855, "loss": 0.8428, "accuracy": 1.0, "learning_rate": 2.522910944265399e-05, "epoch": 0.4970828471411902, "percentage": 49.71, "elapsed_time": "2:56:10", "remaining_time": "2:58:14", "throughput": 790.97, "total_tokens": 8361040} {"current_steps": 6400, "total_steps": 12855, "loss": 1.0255, "accuracy": 0.800000011920929, "learning_rate": 2.516801467836929e-05, "epoch": 0.4978607545702061, "percentage": 49.79, "elapsed_time": "2:56:19", "remaining_time": "2:57:50", "throughput": 791.05, "total_tokens": 8369088} {"current_steps": 6410, "total_steps": 12855, "loss": 1.0829, "accuracy": 0.8999999761581421, "learning_rate": 2.510691891061875e-05, "epoch": 0.4986386619992221, "percentage": 49.86, "elapsed_time": "2:56:31", "remaining_time": "2:57:28", "throughput": 791.09, "total_tokens": 8378512} {"current_steps": 6420, "total_steps": 12855, "loss": 0.8362, "accuracy": 0.800000011920929, "learning_rate": 2.504582250429618e-05, "epoch": 0.49941656942823803, "percentage": 49.94, "elapsed_time": "2:56:51", "remaining_time": "2:57:16", "throughput": 790.94, "total_tokens": 8393488} {"current_steps": 6430, "total_steps": 12855, "loss": 0.899, "accuracy": 0.800000011920929, "learning_rate": 2.498472582429921e-05, "epoch": 0.5001944768572539, "percentage": 50.02, "elapsed_time": "2:57:09", "remaining_time": "2:57:01", "throughput": 790.94, "total_tokens": 8407136} {"current_steps": 6440, "total_steps": 12855, "loss": 0.9596, "accuracy": 0.699999988079071, "learning_rate": 2.4923629235527078e-05, "epoch": 0.5009723842862699, "percentage": 50.1, "elapsed_time": "2:57:44", "remaining_time": "2:57:03", "throughput": 790.07, "total_tokens": 8425696} {"current_steps": 6450, "total_steps": 12855, "loss": 1.5676, "accuracy": 0.800000011920929, "learning_rate": 2.486253310287851e-05, "epoch": 0.5017502917152858, "percentage": 50.18, "elapsed_time": "2:57:59", "remaining_time": "2:56:45", "throughput": 790.2, "total_tokens": 8439280} {"current_steps": 6460, "total_steps": 12855, "loss": 0.7902, "accuracy": 1.0, "learning_rate": 2.4801437791249482e-05, "epoch": 0.5025281991443018, "percentage": 50.25, "elapsed_time": "2:58:24", "remaining_time": "2:56:36", "throughput": 789.99, "total_tokens": 8456080} {"current_steps": 6470, "total_steps": 12855, "loss": 0.8267, "accuracy": 1.0, "learning_rate": 2.4740343665531092e-05, "epoch": 0.5033061065733178, "percentage": 50.33, "elapsed_time": "2:58:37", "remaining_time": "2:56:17", "throughput": 790.17, "total_tokens": 8468992} {"current_steps": 6480, "total_steps": 12855, "loss": 0.9399, "accuracy": 1.0, "learning_rate": 2.4679251090607333e-05, "epoch": 0.5040840140023337, "percentage": 50.41, "elapsed_time": "2:58:51", "remaining_time": "2:55:57", "throughput": 790.33, "total_tokens": 8481024} {"current_steps": 6490, "total_steps": 12855, "loss": 0.9011, "accuracy": 1.0, "learning_rate": 2.4618160431352946e-05, "epoch": 0.5048619214313497, "percentage": 50.49, "elapsed_time": "2:59:07", "remaining_time": "2:55:40", "throughput": 790.19, "total_tokens": 8492816} {"current_steps": 6500, "total_steps": 12855, "loss": 1.0465, "accuracy": 1.0, "learning_rate": 2.455707205263123e-05, "epoch": 0.5056398288603656, "percentage": 50.56, "elapsed_time": "2:59:30", "remaining_time": "2:55:30", "throughput": 790.03, "total_tokens": 8509136} {"current_steps": 6510, "total_steps": 12855, "loss": 0.9967, "accuracy": 0.8999999761581421, "learning_rate": 2.4495986319291857e-05, "epoch": 0.5064177362893816, "percentage": 50.64, "elapsed_time": "2:59:47", "remaining_time": "2:55:13", "throughput": 790.02, "total_tokens": 8522096} {"current_steps": 6520, "total_steps": 12855, "loss": 0.838, "accuracy": 1.0, "learning_rate": 2.443490359616871e-05, "epoch": 0.5071956437183975, "percentage": 50.72, "elapsed_time": "3:00:13", "remaining_time": "2:55:06", "throughput": 789.65, "total_tokens": 8538672} {"current_steps": 6530, "total_steps": 12855, "loss": 1.0419, "accuracy": 0.8999999761581421, "learning_rate": 2.437382424807769e-05, "epoch": 0.5079735511474135, "percentage": 50.8, "elapsed_time": "3:00:27", "remaining_time": "2:54:47", "throughput": 789.66, "total_tokens": 8550192} {"current_steps": 6540, "total_steps": 12855, "loss": 0.8795, "accuracy": 1.0, "learning_rate": 2.431274863981453e-05, "epoch": 0.5087514585764294, "percentage": 50.88, "elapsed_time": "3:00:39", "remaining_time": "2:54:26", "throughput": 789.85, "total_tokens": 8561584} {"current_steps": 6550, "total_steps": 12855, "loss": 0.823, "accuracy": 1.0, "learning_rate": 2.4251677136152642e-05, "epoch": 0.5095293660054454, "percentage": 50.95, "elapsed_time": "3:00:47", "remaining_time": "2:54:02", "throughput": 790.04, "total_tokens": 8570304} {"current_steps": 6560, "total_steps": 12855, "loss": 0.976, "accuracy": 0.800000011920929, "learning_rate": 2.419061010184093e-05, "epoch": 0.5103072734344613, "percentage": 51.03, "elapsed_time": "3:00:56", "remaining_time": "2:53:37", "throughput": 790.33, "total_tokens": 8580016} {"current_steps": 6570, "total_steps": 12855, "loss": 0.6732, "accuracy": 0.8999999761581421, "learning_rate": 2.412954790160157e-05, "epoch": 0.5110851808634772, "percentage": 51.11, "elapsed_time": "3:01:09", "remaining_time": "2:53:17", "throughput": 790.52, "total_tokens": 8592208} {"current_steps": 6580, "total_steps": 12855, "loss": 1.2255, "accuracy": 0.8999999761581421, "learning_rate": 2.4068490900127894e-05, "epoch": 0.5118630882924932, "percentage": 51.19, "elapsed_time": "3:01:20", "remaining_time": "2:52:56", "throughput": 790.72, "total_tokens": 8603552} {"current_steps": 6590, "total_steps": 12855, "loss": 0.9537, "accuracy": 1.0, "learning_rate": 2.4007439462082175e-05, "epoch": 0.5126409957215091, "percentage": 51.26, "elapsed_time": "3:01:44", "remaining_time": "2:52:47", "throughput": 790.56, "total_tokens": 8620960} {"current_steps": 6600, "total_steps": 12855, "loss": 0.9641, "accuracy": 1.0, "learning_rate": 2.394639395209348e-05, "epoch": 0.5134189031505251, "percentage": 51.34, "elapsed_time": "3:01:55", "remaining_time": "2:52:25", "throughput": 790.67, "total_tokens": 8630704} {"current_steps": 6610, "total_steps": 12855, "loss": 0.9, "accuracy": 0.8999999761581421, "learning_rate": 2.388535473475544e-05, "epoch": 0.514196810579541, "percentage": 51.42, "elapsed_time": "3:02:12", "remaining_time": "2:52:09", "throughput": 790.75, "total_tokens": 8645168} {"current_steps": 6620, "total_steps": 12855, "loss": 0.679, "accuracy": 1.0, "learning_rate": 2.382432217462412e-05, "epoch": 0.514974718008557, "percentage": 51.5, "elapsed_time": "3:02:45", "remaining_time": "2:52:07", "throughput": 789.72, "total_tokens": 8659424} {"current_steps": 6630, "total_steps": 12855, "loss": 0.9884, "accuracy": 1.0, "learning_rate": 2.3763296636215824e-05, "epoch": 0.5157526254375729, "percentage": 51.58, "elapsed_time": "3:02:56", "remaining_time": "2:51:45", "throughput": 789.98, "total_tokens": 8671056} {"current_steps": 6640, "total_steps": 12855, "loss": 2.1394, "accuracy": 0.8999999761581421, "learning_rate": 2.3702278484004907e-05, "epoch": 0.5165305328665889, "percentage": 51.65, "elapsed_time": "3:03:11", "remaining_time": "2:51:28", "throughput": 790.05, "total_tokens": 8683952} {"current_steps": 6650, "total_steps": 12855, "loss": 0.8247, "accuracy": 0.8999999761581421, "learning_rate": 2.364126808242163e-05, "epoch": 0.5173084402956049, "percentage": 51.73, "elapsed_time": "3:03:25", "remaining_time": "2:51:08", "throughput": 790.2, "total_tokens": 8696416} {"current_steps": 6660, "total_steps": 12855, "loss": 1.0107, "accuracy": 1.0, "learning_rate": 2.3580265795849944e-05, "epoch": 0.5180863477246208, "percentage": 51.81, "elapsed_time": "3:03:38", "remaining_time": "2:50:49", "throughput": 790.27, "total_tokens": 8707424} {"current_steps": 6670, "total_steps": 12855, "loss": 0.7268, "accuracy": 1.0, "learning_rate": 2.3519271988625344e-05, "epoch": 0.5188642551536368, "percentage": 51.89, "elapsed_time": "3:03:57", "remaining_time": "2:50:34", "throughput": 790.21, "total_tokens": 8721984} {"current_steps": 6680, "total_steps": 12855, "loss": 0.8181, "accuracy": 0.8999999761581421, "learning_rate": 2.3458287025032697e-05, "epoch": 0.5196421625826526, "percentage": 51.96, "elapsed_time": "3:04:07", "remaining_time": "2:50:12", "throughput": 790.26, "total_tokens": 8730688} {"current_steps": 6690, "total_steps": 12855, "loss": 0.9587, "accuracy": 0.8999999761581421, "learning_rate": 2.3397311269304006e-05, "epoch": 0.5204200700116686, "percentage": 52.04, "elapsed_time": "3:04:23", "remaining_time": "2:49:55", "throughput": 790.33, "total_tokens": 8744160} {"current_steps": 6700, "total_steps": 12855, "loss": 0.8714, "accuracy": 0.699999988079071, "learning_rate": 2.3336345085616324e-05, "epoch": 0.5211979774406845, "percentage": 52.12, "elapsed_time": "3:04:37", "remaining_time": "2:49:36", "throughput": 790.49, "total_tokens": 8756560} {"current_steps": 6710, "total_steps": 12855, "loss": 1.1347, "accuracy": 1.0, "learning_rate": 2.3275388838089517e-05, "epoch": 0.5219758848697005, "percentage": 52.2, "elapsed_time": "3:04:49", "remaining_time": "2:49:16", "throughput": 790.57, "total_tokens": 8767408} {"current_steps": 6720, "total_steps": 12855, "loss": 0.8482, "accuracy": 1.0, "learning_rate": 2.3214442890784107e-05, "epoch": 0.5227537922987164, "percentage": 52.28, "elapsed_time": "3:05:13", "remaining_time": "2:49:06", "throughput": 790.54, "total_tokens": 8785664} {"current_steps": 6730, "total_steps": 12855, "loss": 0.7021, "accuracy": 1.0, "learning_rate": 2.315350760769911e-05, "epoch": 0.5235316997277324, "percentage": 52.35, "elapsed_time": "3:05:23", "remaining_time": "2:48:43", "throughput": 790.67, "total_tokens": 8795008} {"current_steps": 6740, "total_steps": 12855, "loss": 1.1258, "accuracy": 1.0, "learning_rate": 2.3092583352769832e-05, "epoch": 0.5243096071567483, "percentage": 52.43, "elapsed_time": "3:05:38", "remaining_time": "2:48:25", "throughput": 790.7, "total_tokens": 8807312} {"current_steps": 6750, "total_steps": 12855, "loss": 1.1774, "accuracy": 1.0, "learning_rate": 2.303167048986573e-05, "epoch": 0.5250875145857643, "percentage": 52.51, "elapsed_time": "3:05:53", "remaining_time": "2:48:07", "throughput": 790.89, "total_tokens": 8821056} {"current_steps": 6760, "total_steps": 12855, "loss": 1.0464, "accuracy": 0.800000011920929, "learning_rate": 2.2970769382788215e-05, "epoch": 0.5258654220147803, "percentage": 52.59, "elapsed_time": "3:06:04", "remaining_time": "2:47:46", "throughput": 791.06, "total_tokens": 8831952} {"current_steps": 6770, "total_steps": 12855, "loss": 0.6572, "accuracy": 1.0, "learning_rate": 2.2909880395268478e-05, "epoch": 0.5266433294437962, "percentage": 52.66, "elapsed_time": "3:06:17", "remaining_time": "2:47:26", "throughput": 791.24, "total_tokens": 8844432} {"current_steps": 6780, "total_steps": 12855, "loss": 0.9214, "accuracy": 1.0, "learning_rate": 2.2849003890965347e-05, "epoch": 0.5274212368728122, "percentage": 52.74, "elapsed_time": "3:06:30", "remaining_time": "2:47:06", "throughput": 791.36, "total_tokens": 8855632} {"current_steps": 6790, "total_steps": 12855, "loss": 1.0254, "accuracy": 0.8999999761581421, "learning_rate": 2.278814023346307e-05, "epoch": 0.5281991443018281, "percentage": 52.82, "elapsed_time": "3:06:45", "remaining_time": "2:46:48", "throughput": 791.36, "total_tokens": 8867264} {"current_steps": 6800, "total_steps": 12855, "loss": 0.9748, "accuracy": 1.0, "learning_rate": 2.2727289786269177e-05, "epoch": 0.5289770517308441, "percentage": 52.9, "elapsed_time": "3:06:56", "remaining_time": "2:46:27", "throughput": 791.65, "total_tokens": 8879312} {"current_steps": 6810, "total_steps": 12855, "loss": 0.9884, "accuracy": 1.0, "learning_rate": 2.2666452912812326e-05, "epoch": 0.5297549591598599, "percentage": 52.98, "elapsed_time": "3:07:08", "remaining_time": "2:46:06", "throughput": 791.74, "total_tokens": 8889840} {"current_steps": 6820, "total_steps": 12855, "loss": 1.0548, "accuracy": 1.0, "learning_rate": 2.2605629976440054e-05, "epoch": 0.5305328665888759, "percentage": 53.05, "elapsed_time": "3:07:19", "remaining_time": "2:45:45", "throughput": 791.88, "total_tokens": 8900288} {"current_steps": 6830, "total_steps": 12855, "loss": 0.8124, "accuracy": 0.800000011920929, "learning_rate": 2.2544821340416696e-05, "epoch": 0.5313107740178918, "percentage": 53.13, "elapsed_time": "3:07:34", "remaining_time": "2:45:28", "throughput": 792.02, "total_tokens": 8913792} {"current_steps": 6840, "total_steps": 12855, "loss": 0.9119, "accuracy": 1.0, "learning_rate": 2.2484027367921172e-05, "epoch": 0.5320886814469078, "percentage": 53.21, "elapsed_time": "3:07:46", "remaining_time": "2:45:07", "throughput": 792.1, "total_tokens": 8924320} {"current_steps": 6850, "total_steps": 12855, "loss": 0.8929, "accuracy": 0.800000011920929, "learning_rate": 2.2423248422044812e-05, "epoch": 0.5328665888759238, "percentage": 53.29, "elapsed_time": "3:07:56", "remaining_time": "2:44:45", "throughput": 792.25, "total_tokens": 8933520} {"current_steps": 6860, "total_steps": 12855, "loss": 0.8283, "accuracy": 0.8999999761581421, "learning_rate": 2.2362484865789222e-05, "epoch": 0.5336444963049397, "percentage": 53.36, "elapsed_time": "3:08:14", "remaining_time": "2:44:29", "throughput": 792.26, "total_tokens": 8947824} {"current_steps": 6870, "total_steps": 12855, "loss": 0.9492, "accuracy": 1.0, "learning_rate": 2.230173706206408e-05, "epoch": 0.5344224037339557, "percentage": 53.44, "elapsed_time": "3:08:34", "remaining_time": "2:44:16", "throughput": 792.24, "total_tokens": 8963552} {"current_steps": 6880, "total_steps": 12855, "loss": 1.0958, "accuracy": 1.0, "learning_rate": 2.2241005373684973e-05, "epoch": 0.5352003111629716, "percentage": 53.52, "elapsed_time": "3:08:44", "remaining_time": "2:43:55", "throughput": 792.39, "total_tokens": 8973680} {"current_steps": 6890, "total_steps": 12855, "loss": 0.8035, "accuracy": 1.0, "learning_rate": 2.2180290163371254e-05, "epoch": 0.5359782185919876, "percentage": 53.6, "elapsed_time": "3:09:02", "remaining_time": "2:43:40", "throughput": 792.24, "total_tokens": 8986320} {"current_steps": 6900, "total_steps": 12855, "loss": 1.0727, "accuracy": 0.800000011920929, "learning_rate": 2.2119591793743858e-05, "epoch": 0.5367561260210035, "percentage": 53.68, "elapsed_time": "3:09:15", "remaining_time": "2:43:20", "throughput": 792.35, "total_tokens": 8997776} {"current_steps": 6910, "total_steps": 12855, "loss": 0.9051, "accuracy": 0.800000011920929, "learning_rate": 2.205891062732313e-05, "epoch": 0.5375340334500195, "percentage": 53.75, "elapsed_time": "3:09:27", "remaining_time": "2:43:00", "throughput": 792.45, "total_tokens": 9008288} {"current_steps": 6920, "total_steps": 12855, "loss": 0.9325, "accuracy": 0.8999999761581421, "learning_rate": 2.1998247026526687e-05, "epoch": 0.5383119408790354, "percentage": 53.83, "elapsed_time": "3:09:51", "remaining_time": "2:42:50", "throughput": 792.19, "total_tokens": 9024400} {"current_steps": 6930, "total_steps": 12855, "loss": 1.2041, "accuracy": 0.800000011920929, "learning_rate": 2.1937601353667224e-05, "epoch": 0.5390898483080513, "percentage": 53.91, "elapsed_time": "3:10:02", "remaining_time": "2:42:28", "throughput": 792.35, "total_tokens": 9034432} {"current_steps": 6940, "total_steps": 12855, "loss": 0.9098, "accuracy": 1.0, "learning_rate": 2.187697397095035e-05, "epoch": 0.5398677557370672, "percentage": 53.99, "elapsed_time": "3:10:14", "remaining_time": "2:42:08", "throughput": 792.53, "total_tokens": 9046656} {"current_steps": 6950, "total_steps": 12855, "loss": 0.9026, "accuracy": 0.8999999761581421, "learning_rate": 2.1816365240472458e-05, "epoch": 0.5406456631660832, "percentage": 54.06, "elapsed_time": "3:10:32", "remaining_time": "2:41:53", "throughput": 792.56, "total_tokens": 9061104} {"current_steps": 6960, "total_steps": 12855, "loss": 1.0318, "accuracy": 0.8999999761581421, "learning_rate": 2.175577552421853e-05, "epoch": 0.5414235705950992, "percentage": 54.14, "elapsed_time": "3:10:51", "remaining_time": "2:41:39", "throughput": 792.52, "total_tokens": 9075488} {"current_steps": 6970, "total_steps": 12855, "loss": 0.7524, "accuracy": 1.0, "learning_rate": 2.1695205184059987e-05, "epoch": 0.5422014780241151, "percentage": 54.22, "elapsed_time": "3:11:06", "remaining_time": "2:41:21", "throughput": 792.55, "total_tokens": 9087680} {"current_steps": 6980, "total_steps": 12855, "loss": 1.0431, "accuracy": 1.0, "learning_rate": 2.1634654581752517e-05, "epoch": 0.5429793854531311, "percentage": 54.3, "elapsed_time": "3:11:23", "remaining_time": "2:41:05", "throughput": 792.76, "total_tokens": 9103792} {"current_steps": 6990, "total_steps": 12855, "loss": 0.9666, "accuracy": 1.0, "learning_rate": 2.1574124078933953e-05, "epoch": 0.543757292882147, "percentage": 54.38, "elapsed_time": "3:11:42", "remaining_time": "2:40:51", "throughput": 792.83, "total_tokens": 9119392} {"current_steps": 7000, "total_steps": 12855, "loss": 0.9071, "accuracy": 1.0, "learning_rate": 2.151361403712205e-05, "epoch": 0.544535200311163, "percentage": 54.45, "elapsed_time": "3:11:55", "remaining_time": "2:40:32", "throughput": 792.93, "total_tokens": 9131184} {"current_steps": 7010, "total_steps": 12855, "loss": 1.0268, "accuracy": 1.0, "learning_rate": 2.1453124817712382e-05, "epoch": 0.5453131077401789, "percentage": 54.53, "elapsed_time": "3:12:22", "remaining_time": "2:40:24", "throughput": 792.32, "total_tokens": 9145184} {"current_steps": 7020, "total_steps": 12855, "loss": 1.0347, "accuracy": 0.699999988079071, "learning_rate": 2.1392656781976147e-05, "epoch": 0.5460910151691949, "percentage": 54.61, "elapsed_time": "3:12:40", "remaining_time": "2:40:09", "throughput": 792.49, "total_tokens": 9161856} {"current_steps": 7030, "total_steps": 12855, "loss": 1.1721, "accuracy": 1.0, "learning_rate": 2.1332210291058037e-05, "epoch": 0.5468689225982108, "percentage": 54.69, "elapsed_time": "3:13:03", "remaining_time": "2:39:57", "throughput": 792.29, "total_tokens": 9177152} {"current_steps": 7040, "total_steps": 12855, "loss": 0.9255, "accuracy": 0.800000011920929, "learning_rate": 2.1271785705974058e-05, "epoch": 0.5476468300272268, "percentage": 54.76, "elapsed_time": "3:13:20", "remaining_time": "2:39:41", "throughput": 792.37, "total_tokens": 9191776} {"current_steps": 7050, "total_steps": 12855, "loss": 0.8748, "accuracy": 1.0, "learning_rate": 2.1211383387609383e-05, "epoch": 0.5484247374562428, "percentage": 54.84, "elapsed_time": "3:13:45", "remaining_time": "2:39:32", "throughput": 792.08, "total_tokens": 9208192} {"current_steps": 7060, "total_steps": 12855, "loss": 1.0409, "accuracy": 0.8999999761581421, "learning_rate": 2.1151003696716217e-05, "epoch": 0.5492026448852586, "percentage": 54.92, "elapsed_time": "3:13:57", "remaining_time": "2:39:12", "throughput": 792.31, "total_tokens": 9220816} {"current_steps": 7070, "total_steps": 12855, "loss": 0.8847, "accuracy": 1.0, "learning_rate": 2.1090646993911588e-05, "epoch": 0.5499805523142746, "percentage": 55.0, "elapsed_time": "3:14:13", "remaining_time": "2:38:55", "throughput": 792.41, "total_tokens": 9233984} {"current_steps": 7080, "total_steps": 12855, "loss": 0.9708, "accuracy": 0.699999988079071, "learning_rate": 2.1030313639675253e-05, "epoch": 0.5507584597432905, "percentage": 55.08, "elapsed_time": "3:14:26", "remaining_time": "2:38:36", "throughput": 792.45, "total_tokens": 9245328} {"current_steps": 7090, "total_steps": 12855, "loss": 1.0218, "accuracy": 0.8999999761581421, "learning_rate": 2.0970003994347514e-05, "epoch": 0.5515363671723065, "percentage": 55.15, "elapsed_time": "3:14:45", "remaining_time": "2:38:21", "throughput": 792.44, "total_tokens": 9259760} {"current_steps": 7100, "total_steps": 12855, "loss": 1.0323, "accuracy": 1.0, "learning_rate": 2.0909718418127077e-05, "epoch": 0.5523142746013224, "percentage": 55.23, "elapsed_time": "3:15:00", "remaining_time": "2:38:03", "throughput": 792.58, "total_tokens": 9273216} {"current_steps": 7110, "total_steps": 12855, "loss": 0.9503, "accuracy": 0.8999999761581421, "learning_rate": 2.084945727106888e-05, "epoch": 0.5530921820303384, "percentage": 55.31, "elapsed_time": "3:15:14", "remaining_time": "2:37:45", "throughput": 792.56, "total_tokens": 9284144} {"current_steps": 7120, "total_steps": 12855, "loss": 2.4995, "accuracy": 0.8999999761581421, "learning_rate": 2.0789220913081973e-05, "epoch": 0.5538700894593543, "percentage": 55.39, "elapsed_time": "3:15:25", "remaining_time": "2:37:24", "throughput": 792.68, "total_tokens": 9294624} {"current_steps": 7130, "total_steps": 12855, "loss": 0.9927, "accuracy": 1.0, "learning_rate": 2.0729009703927353e-05, "epoch": 0.5546479968883703, "percentage": 55.46, "elapsed_time": "3:15:43", "remaining_time": "2:37:09", "throughput": 792.65, "total_tokens": 9308192} {"current_steps": 7140, "total_steps": 12855, "loss": 0.9522, "accuracy": 1.0, "learning_rate": 2.066882400321581e-05, "epoch": 0.5554259043173863, "percentage": 55.54, "elapsed_time": "3:16:01", "remaining_time": "2:36:54", "throughput": 792.75, "total_tokens": 9323920} {"current_steps": 7150, "total_steps": 12855, "loss": 0.8797, "accuracy": 1.0, "learning_rate": 2.0608664170405783e-05, "epoch": 0.5562038117464022, "percentage": 55.62, "elapsed_time": "3:16:21", "remaining_time": "2:36:40", "throughput": 792.77, "total_tokens": 9339744} {"current_steps": 7160, "total_steps": 12855, "loss": 1.199, "accuracy": 1.0, "learning_rate": 2.054853056480122e-05, "epoch": 0.5569817191754182, "percentage": 55.7, "elapsed_time": "3:16:57", "remaining_time": "2:36:39", "throughput": 791.75, "total_tokens": 9356800} {"current_steps": 7170, "total_steps": 12855, "loss": 0.7792, "accuracy": 1.0, "learning_rate": 2.048842354554943e-05, "epoch": 0.5577596266044341, "percentage": 55.78, "elapsed_time": "3:17:14", "remaining_time": "2:36:23", "throughput": 791.81, "total_tokens": 9370544} {"current_steps": 7180, "total_steps": 12855, "loss": 0.8138, "accuracy": 0.8999999761581421, "learning_rate": 2.0428343471638933e-05, "epoch": 0.55853753403345, "percentage": 55.85, "elapsed_time": "3:17:26", "remaining_time": "2:36:03", "throughput": 791.84, "total_tokens": 9380608} {"current_steps": 7190, "total_steps": 12855, "loss": 0.9823, "accuracy": 0.8999999761581421, "learning_rate": 2.0368290701897306e-05, "epoch": 0.5593154414624659, "percentage": 55.93, "elapsed_time": "3:17:36", "remaining_time": "2:35:41", "throughput": 791.91, "total_tokens": 9389424} {"current_steps": 7200, "total_steps": 12855, "loss": 0.8881, "accuracy": 1.0, "learning_rate": 2.030826559498907e-05, "epoch": 0.5600933488914819, "percentage": 56.01, "elapsed_time": "3:17:58", "remaining_time": "2:35:29", "throughput": 791.83, "total_tokens": 9405392} {"current_steps": 7210, "total_steps": 12855, "loss": 1.3145, "accuracy": 0.699999988079071, "learning_rate": 2.0248268509413522e-05, "epoch": 0.5608712563204978, "percentage": 56.09, "elapsed_time": "3:18:15", "remaining_time": "2:35:13", "throughput": 791.82, "total_tokens": 9419088} {"current_steps": 7220, "total_steps": 12855, "loss": 1.061, "accuracy": 0.8999999761581421, "learning_rate": 2.01882998035026e-05, "epoch": 0.5616491637495138, "percentage": 56.16, "elapsed_time": "3:18:57", "remaining_time": "2:35:16", "throughput": 790.72, "total_tokens": 9439232} {"current_steps": 7230, "total_steps": 12855, "loss": 0.8583, "accuracy": 1.0, "learning_rate": 2.012835983541876e-05, "epoch": 0.5624270711785297, "percentage": 56.24, "elapsed_time": "3:19:23", "remaining_time": "2:35:07", "throughput": 790.46, "total_tokens": 9456352} {"current_steps": 7240, "total_steps": 12855, "loss": 0.9786, "accuracy": 1.0, "learning_rate": 2.0068448963152786e-05, "epoch": 0.5632049786075457, "percentage": 56.32, "elapsed_time": "3:19:35", "remaining_time": "2:34:47", "throughput": 790.56, "total_tokens": 9467104} {"current_steps": 7250, "total_steps": 12855, "loss": 0.989, "accuracy": 1.0, "learning_rate": 2.000856754452173e-05, "epoch": 0.5639828860365617, "percentage": 56.4, "elapsed_time": "3:19:52", "remaining_time": "2:34:31", "throughput": 790.53, "total_tokens": 9480304} {"current_steps": 7260, "total_steps": 12855, "loss": 0.9374, "accuracy": 0.8999999761581421, "learning_rate": 1.9948715937166708e-05, "epoch": 0.5647607934655776, "percentage": 56.48, "elapsed_time": "3:20:13", "remaining_time": "2:34:18", "throughput": 790.49, "total_tokens": 9496448} {"current_steps": 7270, "total_steps": 12855, "loss": 0.7117, "accuracy": 1.0, "learning_rate": 1.9888894498550798e-05, "epoch": 0.5655387008945936, "percentage": 56.55, "elapsed_time": "3:20:31", "remaining_time": "2:34:02", "throughput": 790.42, "total_tokens": 9509680} {"current_steps": 7280, "total_steps": 12855, "loss": 0.8988, "accuracy": 0.8999999761581421, "learning_rate": 1.9829103585956882e-05, "epoch": 0.5663166083236095, "percentage": 56.63, "elapsed_time": "3:20:46", "remaining_time": "2:33:45", "throughput": 790.57, "total_tokens": 9523712} {"current_steps": 7290, "total_steps": 12855, "loss": 0.8419, "accuracy": 0.8999999761581421, "learning_rate": 1.9769343556485544e-05, "epoch": 0.5670945157526255, "percentage": 56.71, "elapsed_time": "3:20:56", "remaining_time": "2:33:23", "throughput": 790.71, "total_tokens": 9533104} {"current_steps": 7300, "total_steps": 12855, "loss": 2.1731, "accuracy": 0.800000011920929, "learning_rate": 1.97096147670529e-05, "epoch": 0.5678724231816414, "percentage": 56.79, "elapsed_time": "3:21:10", "remaining_time": "2:33:04", "throughput": 790.72, "total_tokens": 9544176} {"current_steps": 7310, "total_steps": 12855, "loss": 0.8518, "accuracy": 1.0, "learning_rate": 1.964991757438851e-05, "epoch": 0.5686503306106573, "percentage": 56.87, "elapsed_time": "3:21:23", "remaining_time": "2:32:45", "throughput": 790.73, "total_tokens": 9554544} {"current_steps": 7320, "total_steps": 12855, "loss": 0.7806, "accuracy": 1.0, "learning_rate": 1.9590252335033193e-05, "epoch": 0.5694282380396732, "percentage": 56.94, "elapsed_time": "3:21:33", "remaining_time": "2:32:24", "throughput": 790.85, "total_tokens": 9564480} {"current_steps": 7330, "total_steps": 12855, "loss": 0.875, "accuracy": 1.0, "learning_rate": 1.953061940533695e-05, "epoch": 0.5702061454686892, "percentage": 57.02, "elapsed_time": "3:21:42", "remaining_time": "2:32:02", "throughput": 791.13, "total_tokens": 9574912} {"current_steps": 7340, "total_steps": 12855, "loss": 0.95, "accuracy": 0.800000011920929, "learning_rate": 1.94710191414568e-05, "epoch": 0.5709840528977052, "percentage": 57.1, "elapsed_time": "3:22:02", "remaining_time": "2:31:48", "throughput": 790.88, "total_tokens": 9587824} {"current_steps": 7350, "total_steps": 12855, "loss": 0.9723, "accuracy": 1.0, "learning_rate": 1.941145189935467e-05, "epoch": 0.5717619603267211, "percentage": 57.18, "elapsed_time": "3:22:16", "remaining_time": "2:31:29", "throughput": 790.97, "total_tokens": 9599248} {"current_steps": 7360, "total_steps": 12855, "loss": 0.7599, "accuracy": 0.8999999761581421, "learning_rate": 1.935191803479527e-05, "epoch": 0.5725398677557371, "percentage": 57.25, "elapsed_time": "3:22:26", "remaining_time": "2:31:08", "throughput": 791.12, "total_tokens": 9609584} {"current_steps": 7370, "total_steps": 12855, "loss": 1.1131, "accuracy": 0.8999999761581421, "learning_rate": 1.9292417903343953e-05, "epoch": 0.573317775184753, "percentage": 57.33, "elapsed_time": "3:22:52", "remaining_time": "2:30:59", "throughput": 791.06, "total_tokens": 9629072} {"current_steps": 7380, "total_steps": 12855, "loss": 0.9861, "accuracy": 1.0, "learning_rate": 1.923295186036461e-05, "epoch": 0.574095682613769, "percentage": 57.41, "elapsed_time": "3:23:08", "remaining_time": "2:30:42", "throughput": 791.03, "total_tokens": 9641760} {"current_steps": 7390, "total_steps": 12855, "loss": 3.1164, "accuracy": 0.8999999761581421, "learning_rate": 1.917352026101754e-05, "epoch": 0.5748735900427849, "percentage": 57.49, "elapsed_time": "3:23:30", "remaining_time": "2:30:29", "throughput": 791.13, "total_tokens": 9659728} {"current_steps": 7400, "total_steps": 12855, "loss": 0.8919, "accuracy": 0.8999999761581421, "learning_rate": 1.9114123460257317e-05, "epoch": 0.5756514974718009, "percentage": 57.57, "elapsed_time": "3:23:40", "remaining_time": "2:30:08", "throughput": 791.28, "total_tokens": 9669920} {"current_steps": 7410, "total_steps": 12855, "loss": 1.1206, "accuracy": 0.699999988079071, "learning_rate": 1.905476181283069e-05, "epoch": 0.5764294049008168, "percentage": 57.64, "elapsed_time": "3:23:50", "remaining_time": "2:29:47", "throughput": 791.44, "total_tokens": 9679776} {"current_steps": 7420, "total_steps": 12855, "loss": 0.9453, "accuracy": 0.8999999761581421, "learning_rate": 1.8995435673274452e-05, "epoch": 0.5772073123298328, "percentage": 57.72, "elapsed_time": "3:24:05", "remaining_time": "2:29:29", "throughput": 791.58, "total_tokens": 9693408} {"current_steps": 7430, "total_steps": 12855, "loss": 0.9898, "accuracy": 0.8999999761581421, "learning_rate": 1.8936145395913336e-05, "epoch": 0.5779852197588486, "percentage": 57.8, "elapsed_time": "3:24:23", "remaining_time": "2:29:13", "throughput": 791.65, "total_tokens": 9708144} {"current_steps": 7440, "total_steps": 12855, "loss": 1.0364, "accuracy": 0.8999999761581421, "learning_rate": 1.8876891334857858e-05, "epoch": 0.5787631271878646, "percentage": 57.88, "elapsed_time": "3:24:33", "remaining_time": "2:28:52", "throughput": 791.8, "total_tokens": 9717872} {"current_steps": 7450, "total_steps": 12855, "loss": 0.984, "accuracy": 0.8999999761581421, "learning_rate": 1.8817673844002264e-05, "epoch": 0.5795410346168806, "percentage": 57.95, "elapsed_time": "3:24:44", "remaining_time": "2:28:32", "throughput": 791.86, "total_tokens": 9727408} {"current_steps": 7460, "total_steps": 12855, "loss": 0.7025, "accuracy": 1.0, "learning_rate": 1.8758493277022377e-05, "epoch": 0.5803189420458965, "percentage": 58.03, "elapsed_time": "3:24:58", "remaining_time": "2:28:14", "throughput": 792.04, "total_tokens": 9741200} {"current_steps": 7470, "total_steps": 12855, "loss": 1.0205, "accuracy": 0.8999999761581421, "learning_rate": 1.8699349987373482e-05, "epoch": 0.5810968494749125, "percentage": 58.11, "elapsed_time": "3:25:17", "remaining_time": "2:27:59", "throughput": 792.07, "total_tokens": 9756272} {"current_steps": 7480, "total_steps": 12855, "loss": 1.0946, "accuracy": 1.0, "learning_rate": 1.8640244328288237e-05, "epoch": 0.5818747569039284, "percentage": 58.19, "elapsed_time": "3:25:34", "remaining_time": "2:27:43", "throughput": 792.09, "total_tokens": 9770016} {"current_steps": 7490, "total_steps": 12855, "loss": 1.0262, "accuracy": 0.8999999761581421, "learning_rate": 1.8581176652774552e-05, "epoch": 0.5826526643329444, "percentage": 58.27, "elapsed_time": "3:25:51", "remaining_time": "2:27:27", "throughput": 792.23, "total_tokens": 9785408} {"current_steps": 7500, "total_steps": 12855, "loss": 0.8332, "accuracy": 1.0, "learning_rate": 1.8522147313613463e-05, "epoch": 0.5834305717619603, "percentage": 58.34, "elapsed_time": "3:26:05", "remaining_time": "2:27:09", "throughput": 792.25, "total_tokens": 9796592} {"current_steps": 7510, "total_steps": 12855, "loss": 0.9489, "accuracy": 1.0, "learning_rate": 1.8463156663357067e-05, "epoch": 0.5842084791909763, "percentage": 58.42, "elapsed_time": "3:26:37", "remaining_time": "2:27:03", "throughput": 791.68, "total_tokens": 9814848} {"current_steps": 7520, "total_steps": 12855, "loss": 1.1481, "accuracy": 0.800000011920929, "learning_rate": 1.8404205054326385e-05, "epoch": 0.5849863866199922, "percentage": 58.5, "elapsed_time": "3:26:54", "remaining_time": "2:26:47", "throughput": 791.73, "total_tokens": 9829264} {"current_steps": 7530, "total_steps": 12855, "loss": 0.917, "accuracy": 1.0, "learning_rate": 1.834529283860925e-05, "epoch": 0.5857642940490082, "percentage": 58.58, "elapsed_time": "3:27:02", "remaining_time": "2:26:24", "throughput": 791.95, "total_tokens": 9838160} {"current_steps": 7540, "total_steps": 12855, "loss": 0.7729, "accuracy": 0.8999999761581421, "learning_rate": 1.828642036805823e-05, "epoch": 0.5865422014780242, "percentage": 58.65, "elapsed_time": "3:27:14", "remaining_time": "2:26:04", "throughput": 792.1, "total_tokens": 9848976} {"current_steps": 7550, "total_steps": 12855, "loss": 0.8381, "accuracy": 1.0, "learning_rate": 1.8227587994288527e-05, "epoch": 0.5873201089070401, "percentage": 58.73, "elapsed_time": "3:27:26", "remaining_time": "2:25:45", "throughput": 792.26, "total_tokens": 9860736} {"current_steps": 7560, "total_steps": 12855, "loss": 0.9545, "accuracy": 1.0, "learning_rate": 1.8168796068675846e-05, "epoch": 0.588098016336056, "percentage": 58.81, "elapsed_time": "3:27:40", "remaining_time": "2:25:27", "throughput": 792.35, "total_tokens": 9872784} {"current_steps": 7570, "total_steps": 12855, "loss": 0.8773, "accuracy": 1.0, "learning_rate": 1.8110044942354316e-05, "epoch": 0.5888759237650719, "percentage": 58.89, "elapsed_time": "3:27:53", "remaining_time": "2:25:08", "throughput": 792.4, "total_tokens": 9883712} {"current_steps": 7580, "total_steps": 12855, "loss": 0.8084, "accuracy": 1.0, "learning_rate": 1.8051334966214407e-05, "epoch": 0.5896538311940879, "percentage": 58.97, "elapsed_time": "3:28:13", "remaining_time": "2:24:54", "throughput": 792.41, "total_tokens": 9899888} {"current_steps": 7590, "total_steps": 12855, "loss": 0.875, "accuracy": 1.0, "learning_rate": 1.799266649090081e-05, "epoch": 0.5904317386231038, "percentage": 59.04, "elapsed_time": "3:28:25", "remaining_time": "2:24:34", "throughput": 792.49, "total_tokens": 9910800} {"current_steps": 7600, "total_steps": 12855, "loss": 1.0155, "accuracy": 0.8999999761581421, "learning_rate": 1.7934039866810355e-05, "epoch": 0.5912096460521198, "percentage": 59.12, "elapsed_time": "3:28:34", "remaining_time": "2:24:12", "throughput": 792.66, "total_tokens": 9919408} {"current_steps": 7610, "total_steps": 12855, "loss": 0.9998, "accuracy": 0.8999999761581421, "learning_rate": 1.7875455444089924e-05, "epoch": 0.5919875534811357, "percentage": 59.2, "elapsed_time": "3:28:42", "remaining_time": "2:23:50", "throughput": 792.76, "total_tokens": 9927168} {"current_steps": 7620, "total_steps": 12855, "loss": 0.7437, "accuracy": 1.0, "learning_rate": 1.781691357263433e-05, "epoch": 0.5927654609101517, "percentage": 59.28, "elapsed_time": "3:28:51", "remaining_time": "2:23:29", "throughput": 792.82, "total_tokens": 9935056} {"current_steps": 7630, "total_steps": 12855, "loss": 0.8539, "accuracy": 1.0, "learning_rate": 1.7758414602084278e-05, "epoch": 0.5935433683391677, "percentage": 59.35, "elapsed_time": "3:29:05", "remaining_time": "2:23:11", "throughput": 792.83, "total_tokens": 9946608} {"current_steps": 7640, "total_steps": 12855, "loss": 0.9926, "accuracy": 0.800000011920929, "learning_rate": 1.7699958881824217e-05, "epoch": 0.5943212757681836, "percentage": 59.43, "elapsed_time": "3:29:26", "remaining_time": "2:22:57", "throughput": 792.72, "total_tokens": 9961696} {"current_steps": 7650, "total_steps": 12855, "loss": 0.8647, "accuracy": 1.0, "learning_rate": 1.7641546760980322e-05, "epoch": 0.5950991831971996, "percentage": 59.51, "elapsed_time": "3:29:42", "remaining_time": "2:22:41", "throughput": 792.79, "total_tokens": 9975360} {"current_steps": 7660, "total_steps": 12855, "loss": 0.8456, "accuracy": 0.8999999761581421, "learning_rate": 1.7583178588418336e-05, "epoch": 0.5958770906262155, "percentage": 59.59, "elapsed_time": "3:29:55", "remaining_time": "2:22:22", "throughput": 792.99, "total_tokens": 9988336} {"current_steps": 7670, "total_steps": 12855, "loss": 0.9245, "accuracy": 0.800000011920929, "learning_rate": 1.7524854712741535e-05, "epoch": 0.5966549980552315, "percentage": 59.67, "elapsed_time": "3:30:05", "remaining_time": "2:22:01", "throughput": 793.21, "total_tokens": 9998880} {"current_steps": 7680, "total_steps": 12855, "loss": 1.0377, "accuracy": 0.8999999761581421, "learning_rate": 1.7466575482288642e-05, "epoch": 0.5974329054842473, "percentage": 59.74, "elapsed_time": "3:30:27", "remaining_time": "2:21:48", "throughput": 793.07, "total_tokens": 10014272} {"current_steps": 7690, "total_steps": 12855, "loss": 0.9588, "accuracy": 0.8999999761581421, "learning_rate": 1.7408341245131704e-05, "epoch": 0.5982108129132633, "percentage": 59.82, "elapsed_time": "3:30:41", "remaining_time": "2:21:30", "throughput": 793.15, "total_tokens": 10026672} {"current_steps": 7700, "total_steps": 12855, "loss": 0.8349, "accuracy": 0.8999999761581421, "learning_rate": 1.7350152349074083e-05, "epoch": 0.5989887203422792, "percentage": 59.9, "elapsed_time": "3:30:56", "remaining_time": "2:21:13", "throughput": 793.32, "total_tokens": 10040640} {"current_steps": 7710, "total_steps": 12855, "loss": 0.7401, "accuracy": 1.0, "learning_rate": 1.7292009141648335e-05, "epoch": 0.5997666277712952, "percentage": 59.98, "elapsed_time": "3:31:09", "remaining_time": "2:20:54", "throughput": 793.38, "total_tokens": 10051408} {"current_steps": 7720, "total_steps": 12855, "loss": 0.8534, "accuracy": 0.800000011920929, "learning_rate": 1.723391197011412e-05, "epoch": 0.6005445352003111, "percentage": 60.05, "elapsed_time": "3:31:23", "remaining_time": "2:20:36", "throughput": 793.53, "total_tokens": 10064832} {"current_steps": 7730, "total_steps": 12855, "loss": 1.0536, "accuracy": 0.8999999761581421, "learning_rate": 1.717586118145617e-05, "epoch": 0.6013224426293271, "percentage": 60.13, "elapsed_time": "3:31:37", "remaining_time": "2:20:18", "throughput": 793.68, "total_tokens": 10078064} {"current_steps": 7740, "total_steps": 12855, "loss": 0.7957, "accuracy": 0.8999999761581421, "learning_rate": 1.711785712238219e-05, "epoch": 0.6021003500583431, "percentage": 60.21, "elapsed_time": "3:31:58", "remaining_time": "2:20:04", "throughput": 793.61, "total_tokens": 10093328} {"current_steps": 7750, "total_steps": 12855, "loss": 0.7803, "accuracy": 1.0, "learning_rate": 1.7059900139320788e-05, "epoch": 0.602878257487359, "percentage": 60.29, "elapsed_time": "3:32:09", "remaining_time": "2:19:45", "throughput": 793.79, "total_tokens": 10104752} {"current_steps": 7760, "total_steps": 12855, "loss": 1.0745, "accuracy": 1.0, "learning_rate": 1.700199057841942e-05, "epoch": 0.603656164916375, "percentage": 60.37, "elapsed_time": "3:32:23", "remaining_time": "2:19:26", "throughput": 793.92, "total_tokens": 10117184} {"current_steps": 7770, "total_steps": 12855, "loss": 1.0178, "accuracy": 1.0, "learning_rate": 1.694412878554229e-05, "epoch": 0.6044340723453909, "percentage": 60.44, "elapsed_time": "3:32:35", "remaining_time": "2:19:07", "throughput": 794.13, "total_tokens": 10129328} {"current_steps": 7780, "total_steps": 12855, "loss": 1.2516, "accuracy": 0.8999999761581421, "learning_rate": 1.6886315106268356e-05, "epoch": 0.6052119797744069, "percentage": 60.52, "elapsed_time": "3:32:50", "remaining_time": "2:18:50", "throughput": 794.16, "total_tokens": 10142144} {"current_steps": 7790, "total_steps": 12855, "loss": 0.8922, "accuracy": 1.0, "learning_rate": 1.6828549885889168e-05, "epoch": 0.6059898872034228, "percentage": 60.6, "elapsed_time": "3:33:01", "remaining_time": "2:18:30", "throughput": 794.36, "total_tokens": 10153456} {"current_steps": 7800, "total_steps": 12855, "loss": 0.9184, "accuracy": 0.8999999761581421, "learning_rate": 1.677083346940688e-05, "epoch": 0.6067677946324388, "percentage": 60.68, "elapsed_time": "3:33:21", "remaining_time": "2:18:16", "throughput": 794.27, "total_tokens": 10167520} {"current_steps": 7810, "total_steps": 12855, "loss": 0.8519, "accuracy": 0.8999999761581421, "learning_rate": 1.671316620153218e-05, "epoch": 0.6075457020614546, "percentage": 60.75, "elapsed_time": "3:33:35", "remaining_time": "2:17:58", "throughput": 794.31, "total_tokens": 10179824} {"current_steps": 7820, "total_steps": 12855, "loss": 0.7911, "accuracy": 1.0, "learning_rate": 1.665554842668216e-05, "epoch": 0.6083236094904706, "percentage": 60.83, "elapsed_time": "3:34:13", "remaining_time": "2:17:55", "throughput": 793.57, "total_tokens": 10200016} {"current_steps": 7830, "total_steps": 12855, "loss": 1.1917, "accuracy": 0.8999999761581421, "learning_rate": 1.6597980488978383e-05, "epoch": 0.6091015169194866, "percentage": 60.91, "elapsed_time": "3:34:21", "remaining_time": "2:17:34", "throughput": 793.79, "total_tokens": 10209760} {"current_steps": 7840, "total_steps": 12855, "loss": 1.0491, "accuracy": 1.0, "learning_rate": 1.654046273224472e-05, "epoch": 0.6098794243485025, "percentage": 60.99, "elapsed_time": "3:34:38", "remaining_time": "2:17:17", "throughput": 793.92, "total_tokens": 10224176} {"current_steps": 7850, "total_steps": 12855, "loss": 1.1298, "accuracy": 1.0, "learning_rate": 1.648299550000535e-05, "epoch": 0.6106573317775185, "percentage": 61.07, "elapsed_time": "3:34:51", "remaining_time": "2:16:59", "throughput": 794.03, "total_tokens": 10236544} {"current_steps": 7860, "total_steps": 12855, "loss": 0.8854, "accuracy": 0.800000011920929, "learning_rate": 1.6425579135482693e-05, "epoch": 0.6114352392065344, "percentage": 61.14, "elapsed_time": "3:35:04", "remaining_time": "2:16:41", "throughput": 794.09, "total_tokens": 10247648} {"current_steps": 7870, "total_steps": 12855, "loss": 0.9465, "accuracy": 0.8999999761581421, "learning_rate": 1.636821398159536e-05, "epoch": 0.6122131466355504, "percentage": 61.22, "elapsed_time": "3:35:17", "remaining_time": "2:16:22", "throughput": 794.21, "total_tokens": 10259424} {"current_steps": 7880, "total_steps": 12855, "loss": 0.7377, "accuracy": 1.0, "learning_rate": 1.6310900380956107e-05, "epoch": 0.6129910540645663, "percentage": 61.3, "elapsed_time": "3:35:32", "remaining_time": "2:16:04", "throughput": 794.35, "total_tokens": 10272656} {"current_steps": 7890, "total_steps": 12855, "loss": 1.2778, "accuracy": 0.699999988079071, "learning_rate": 1.625363867586979e-05, "epoch": 0.6137689614935823, "percentage": 61.38, "elapsed_time": "3:35:44", "remaining_time": "2:15:45", "throughput": 794.45, "total_tokens": 10283520} {"current_steps": 7900, "total_steps": 12855, "loss": 1.8524, "accuracy": 1.0, "learning_rate": 1.619642920833132e-05, "epoch": 0.6145468689225982, "percentage": 61.45, "elapsed_time": "3:36:05", "remaining_time": "2:15:32", "throughput": 794.44, "total_tokens": 10300160} {"current_steps": 7910, "total_steps": 12855, "loss": 0.7941, "accuracy": 1.0, "learning_rate": 1.6139272320023623e-05, "epoch": 0.6153247763516142, "percentage": 61.53, "elapsed_time": "3:36:20", "remaining_time": "2:15:14", "throughput": 794.62, "total_tokens": 10314528} {"current_steps": 7920, "total_steps": 12855, "loss": 1.0317, "accuracy": 0.800000011920929, "learning_rate": 1.6082168352315595e-05, "epoch": 0.6161026837806302, "percentage": 61.61, "elapsed_time": "3:36:36", "remaining_time": "2:14:58", "throughput": 794.65, "total_tokens": 10327776} {"current_steps": 7930, "total_steps": 12855, "loss": 1.34, "accuracy": 0.8999999761581421, "learning_rate": 1.6025117646260064e-05, "epoch": 0.616880591209646, "percentage": 61.69, "elapsed_time": "3:37:00", "remaining_time": "2:14:46", "throughput": 794.48, "total_tokens": 10344272} {"current_steps": 7940, "total_steps": 12855, "loss": 0.8567, "accuracy": 0.800000011920929, "learning_rate": 1.5968120542591737e-05, "epoch": 0.617658498638662, "percentage": 61.77, "elapsed_time": "3:37:17", "remaining_time": "2:14:30", "throughput": 794.45, "total_tokens": 10357504} {"current_steps": 7950, "total_steps": 12855, "loss": 1.011, "accuracy": 1.0, "learning_rate": 1.5911177381725194e-05, "epoch": 0.6184364060676779, "percentage": 61.84, "elapsed_time": "3:37:33", "remaining_time": "2:14:13", "throughput": 794.48, "total_tokens": 10370448} {"current_steps": 7960, "total_steps": 12855, "loss": 0.98, "accuracy": 0.699999988079071, "learning_rate": 1.585428850375286e-05, "epoch": 0.6192143134966939, "percentage": 61.92, "elapsed_time": "3:37:43", "remaining_time": "2:13:53", "throughput": 794.65, "total_tokens": 10381040} {"current_steps": 7970, "total_steps": 12855, "loss": 0.8969, "accuracy": 0.8999999761581421, "learning_rate": 1.5797454248442932e-05, "epoch": 0.6199922209257098, "percentage": 62.0, "elapsed_time": "3:37:55", "remaining_time": "2:13:34", "throughput": 794.83, "total_tokens": 10392496} {"current_steps": 7980, "total_steps": 12855, "loss": 0.9891, "accuracy": 1.0, "learning_rate": 1.5740674955237383e-05, "epoch": 0.6207701283547258, "percentage": 62.08, "elapsed_time": "3:38:11", "remaining_time": "2:13:17", "throughput": 794.9, "total_tokens": 10406624} {"current_steps": 7990, "total_steps": 12855, "loss": 0.7915, "accuracy": 1.0, "learning_rate": 1.568395096324992e-05, "epoch": 0.6215480357837417, "percentage": 62.15, "elapsed_time": "3:38:27", "remaining_time": "2:13:01", "throughput": 794.97, "total_tokens": 10420240} {"current_steps": 8000, "total_steps": 12855, "loss": 1.7128, "accuracy": 0.800000011920929, "learning_rate": 1.562728261126398e-05, "epoch": 0.6223259432127577, "percentage": 62.23, "elapsed_time": "3:38:42", "remaining_time": "2:12:43", "throughput": 795.12, "total_tokens": 10434064} {"current_steps": 8010, "total_steps": 12855, "loss": 0.9822, "accuracy": 0.8999999761581421, "learning_rate": 1.557067023773066e-05, "epoch": 0.6231038506417736, "percentage": 62.31, "elapsed_time": "3:39:08", "remaining_time": "2:12:33", "throughput": 794.73, "total_tokens": 10449616} {"current_steps": 8020, "total_steps": 12855, "loss": 1.0497, "accuracy": 1.0, "learning_rate": 1.5514114180766758e-05, "epoch": 0.6238817580707896, "percentage": 62.39, "elapsed_time": "3:39:22", "remaining_time": "2:12:15", "throughput": 794.82, "total_tokens": 10462192} {"current_steps": 8030, "total_steps": 12855, "loss": 0.994, "accuracy": 1.0, "learning_rate": 1.5457614778152696e-05, "epoch": 0.6246596654998056, "percentage": 62.47, "elapsed_time": "3:39:36", "remaining_time": "2:11:57", "throughput": 795.01, "total_tokens": 10475648} {"current_steps": 8040, "total_steps": 12855, "loss": 0.9753, "accuracy": 0.8999999761581421, "learning_rate": 1.5401172367330563e-05, "epoch": 0.6254375729288215, "percentage": 62.54, "elapsed_time": "3:39:50", "remaining_time": "2:11:39", "throughput": 795.05, "total_tokens": 10487008} {"current_steps": 8050, "total_steps": 12855, "loss": 0.9275, "accuracy": 1.0, "learning_rate": 1.5344787285402036e-05, "epoch": 0.6262154803578374, "percentage": 62.62, "elapsed_time": "3:40:02", "remaining_time": "2:11:20", "throughput": 795.27, "total_tokens": 10499472} {"current_steps": 8060, "total_steps": 12855, "loss": 1.0396, "accuracy": 0.800000011920929, "learning_rate": 1.528845986912639e-05, "epoch": 0.6269933877868533, "percentage": 62.7, "elapsed_time": "3:40:24", "remaining_time": "2:11:07", "throughput": 795.18, "total_tokens": 10515952} {"current_steps": 8070, "total_steps": 12855, "loss": 0.933, "accuracy": 0.8999999761581421, "learning_rate": 1.5232190454918518e-05, "epoch": 0.6277712952158693, "percentage": 62.78, "elapsed_time": "3:40:43", "remaining_time": "2:10:52", "throughput": 795.08, "total_tokens": 10529248} {"current_steps": 8080, "total_steps": 12855, "loss": 1.017, "accuracy": 0.8999999761581421, "learning_rate": 1.5175979378846874e-05, "epoch": 0.6285492026448852, "percentage": 62.85, "elapsed_time": "3:41:00", "remaining_time": "2:10:36", "throughput": 795.02, "total_tokens": 10542224} {"current_steps": 8090, "total_steps": 12855, "loss": 0.9892, "accuracy": 0.8999999761581421, "learning_rate": 1.511982697663151e-05, "epoch": 0.6293271100739012, "percentage": 62.93, "elapsed_time": "3:41:09", "remaining_time": "2:10:15", "throughput": 795.16, "total_tokens": 10551648} {"current_steps": 8100, "total_steps": 12855, "loss": 1.3798, "accuracy": 0.8999999761581421, "learning_rate": 1.5063733583642031e-05, "epoch": 0.6301050175029171, "percentage": 63.01, "elapsed_time": "3:41:21", "remaining_time": "2:09:56", "throughput": 795.32, "total_tokens": 10562768} {"current_steps": 8110, "total_steps": 12855, "loss": 0.9213, "accuracy": 0.8999999761581421, "learning_rate": 1.500769953489562e-05, "epoch": 0.6308829249319331, "percentage": 63.09, "elapsed_time": "3:41:42", "remaining_time": "2:09:42", "throughput": 795.38, "total_tokens": 10580176} {"current_steps": 8120, "total_steps": 12855, "loss": 1.1974, "accuracy": 1.0, "learning_rate": 1.495172516505502e-05, "epoch": 0.631660832360949, "percentage": 63.17, "elapsed_time": "3:42:03", "remaining_time": "2:09:29", "throughput": 795.29, "total_tokens": 10595664} {"current_steps": 8130, "total_steps": 12855, "loss": 0.7445, "accuracy": 1.0, "learning_rate": 1.4895810808426547e-05, "epoch": 0.632438739789965, "percentage": 63.24, "elapsed_time": "3:42:18", "remaining_time": "2:09:12", "throughput": 795.34, "total_tokens": 10609008} {"current_steps": 8140, "total_steps": 12855, "loss": 0.9567, "accuracy": 1.0, "learning_rate": 1.4839956798958088e-05, "epoch": 0.633216647218981, "percentage": 63.32, "elapsed_time": "3:42:35", "remaining_time": "2:08:56", "throughput": 795.31, "total_tokens": 10622096} {"current_steps": 8150, "total_steps": 12855, "loss": 0.8871, "accuracy": 1.0, "learning_rate": 1.4784163470237105e-05, "epoch": 0.6339945546479969, "percentage": 63.4, "elapsed_time": "3:42:51", "remaining_time": "2:08:39", "throughput": 795.34, "total_tokens": 10635136} {"current_steps": 8160, "total_steps": 12855, "loss": 0.7239, "accuracy": 1.0, "learning_rate": 1.4728431155488648e-05, "epoch": 0.6347724620770129, "percentage": 63.48, "elapsed_time": "3:43:02", "remaining_time": "2:08:19", "throughput": 795.5, "total_tokens": 10645920} {"current_steps": 8170, "total_steps": 12855, "loss": 1.1202, "accuracy": 0.800000011920929, "learning_rate": 1.4672760187573361e-05, "epoch": 0.6355503695060288, "percentage": 63.56, "elapsed_time": "3:43:14", "remaining_time": "2:08:00", "throughput": 795.62, "total_tokens": 10657040} {"current_steps": 8180, "total_steps": 12855, "loss": 0.6829, "accuracy": 1.0, "learning_rate": 1.4617150898985504e-05, "epoch": 0.6363282769350447, "percentage": 63.63, "elapsed_time": "3:43:34", "remaining_time": "2:07:46", "throughput": 795.66, "total_tokens": 10673296} {"current_steps": 8190, "total_steps": 12855, "loss": 1.039, "accuracy": 1.0, "learning_rate": 1.4561603621850933e-05, "epoch": 0.6371061843640606, "percentage": 63.71, "elapsed_time": "3:43:48", "remaining_time": "2:07:28", "throughput": 795.85, "total_tokens": 10686848} {"current_steps": 8200, "total_steps": 12855, "loss": 0.8505, "accuracy": 0.8999999761581421, "learning_rate": 1.4506118687925158e-05, "epoch": 0.6378840917930766, "percentage": 63.79, "elapsed_time": "3:44:04", "remaining_time": "2:07:11", "throughput": 795.83, "total_tokens": 10699184} {"current_steps": 8210, "total_steps": 12855, "loss": 0.8932, "accuracy": 0.8999999761581421, "learning_rate": 1.4450696428591346e-05, "epoch": 0.6386619992220925, "percentage": 63.87, "elapsed_time": "3:44:19", "remaining_time": "2:06:55", "throughput": 796.04, "total_tokens": 10714544} {"current_steps": 8220, "total_steps": 12855, "loss": 0.9208, "accuracy": 0.8999999761581421, "learning_rate": 1.4395337174858336e-05, "epoch": 0.6394399066511085, "percentage": 63.94, "elapsed_time": "3:44:40", "remaining_time": "2:06:41", "throughput": 795.93, "total_tokens": 10729824} {"current_steps": 8230, "total_steps": 12855, "loss": 1.0354, "accuracy": 1.0, "learning_rate": 1.4340041257358678e-05, "epoch": 0.6402178140801245, "percentage": 64.02, "elapsed_time": "3:44:56", "remaining_time": "2:06:24", "throughput": 795.92, "total_tokens": 10742416} {"current_steps": 8240, "total_steps": 12855, "loss": 0.9911, "accuracy": 0.8999999761581421, "learning_rate": 1.4284809006346625e-05, "epoch": 0.6409957215091404, "percentage": 64.1, "elapsed_time": "3:45:16", "remaining_time": "2:06:10", "throughput": 795.94, "total_tokens": 10758448} {"current_steps": 8250, "total_steps": 12855, "loss": 0.8629, "accuracy": 1.0, "learning_rate": 1.4229640751696194e-05, "epoch": 0.6417736289381564, "percentage": 64.18, "elapsed_time": "3:45:29", "remaining_time": "2:05:51", "throughput": 796.07, "total_tokens": 10770160} {"current_steps": 8260, "total_steps": 12855, "loss": 0.7704, "accuracy": 0.8999999761581421, "learning_rate": 1.4174536822899201e-05, "epoch": 0.6425515363671723, "percentage": 64.26, "elapsed_time": "3:45:36", "remaining_time": "2:05:30", "throughput": 796.22, "total_tokens": 10778368} {"current_steps": 8270, "total_steps": 12855, "loss": 0.6591, "accuracy": 0.8999999761581421, "learning_rate": 1.4119497549063254e-05, "epoch": 0.6433294437961883, "percentage": 64.33, "elapsed_time": "3:45:59", "remaining_time": "2:05:17", "throughput": 796.03, "total_tokens": 10793760} {"current_steps": 8280, "total_steps": 12855, "loss": 1.4628, "accuracy": 0.8999999761581421, "learning_rate": 1.4064523258909812e-05, "epoch": 0.6441073512252042, "percentage": 64.41, "elapsed_time": "3:46:14", "remaining_time": "2:05:00", "throughput": 796.09, "total_tokens": 10806208} {"current_steps": 8290, "total_steps": 12855, "loss": 0.9929, "accuracy": 0.8999999761581421, "learning_rate": 1.4009614280772232e-05, "epoch": 0.6448852586542202, "percentage": 64.49, "elapsed_time": "3:46:39", "remaining_time": "2:04:48", "throughput": 795.7, "total_tokens": 10821328} {"current_steps": 8300, "total_steps": 12855, "loss": 0.9003, "accuracy": 1.0, "learning_rate": 1.3954770942593799e-05, "epoch": 0.645663166083236, "percentage": 64.57, "elapsed_time": "3:46:49", "remaining_time": "2:04:28", "throughput": 795.79, "total_tokens": 10829936} {"current_steps": 8310, "total_steps": 12855, "loss": 0.9982, "accuracy": 0.800000011920929, "learning_rate": 1.3899993571925723e-05, "epoch": 0.646441073512252, "percentage": 64.64, "elapsed_time": "3:47:03", "remaining_time": "2:04:11", "throughput": 795.82, "total_tokens": 10841696} {"current_steps": 8320, "total_steps": 12855, "loss": 0.7966, "accuracy": 1.0, "learning_rate": 1.3845282495925277e-05, "epoch": 0.647218980941268, "percentage": 64.72, "elapsed_time": "3:47:25", "remaining_time": "2:03:57", "throughput": 795.76, "total_tokens": 10858688} {"current_steps": 8330, "total_steps": 12855, "loss": 1.0353, "accuracy": 0.800000011920929, "learning_rate": 1.379063804135376e-05, "epoch": 0.6479968883702839, "percentage": 64.8, "elapsed_time": "3:47:45", "remaining_time": "2:03:43", "throughput": 795.73, "total_tokens": 10873904} {"current_steps": 8340, "total_steps": 12855, "loss": 1.0799, "accuracy": 1.0, "learning_rate": 1.373606053457458e-05, "epoch": 0.6487747957992999, "percentage": 64.88, "elapsed_time": "3:48:21", "remaining_time": "2:03:37", "throughput": 795.14, "total_tokens": 10894304} {"current_steps": 8350, "total_steps": 12855, "loss": 0.7538, "accuracy": 1.0, "learning_rate": 1.368155030155131e-05, "epoch": 0.6495527032283158, "percentage": 64.96, "elapsed_time": "3:48:38", "remaining_time": "2:03:21", "throughput": 795.17, "total_tokens": 10908752} {"current_steps": 8360, "total_steps": 12855, "loss": 0.8713, "accuracy": 0.800000011920929, "learning_rate": 1.3627107667845717e-05, "epoch": 0.6503306106573318, "percentage": 65.03, "elapsed_time": "3:48:54", "remaining_time": "2:03:04", "throughput": 795.25, "total_tokens": 10922384} {"current_steps": 8370, "total_steps": 12855, "loss": 0.8994, "accuracy": 0.8999999761581421, "learning_rate": 1.3572732958615847e-05, "epoch": 0.6511085180863477, "percentage": 65.11, "elapsed_time": "3:49:10", "remaining_time": "2:02:48", "throughput": 795.26, "total_tokens": 10935392} {"current_steps": 8380, "total_steps": 12855, "loss": 0.9469, "accuracy": 1.0, "learning_rate": 1.3518426498614039e-05, "epoch": 0.6518864255153637, "percentage": 65.19, "elapsed_time": "3:49:44", "remaining_time": "2:02:41", "throughput": 794.39, "total_tokens": 10950480} {"current_steps": 8390, "total_steps": 12855, "loss": 0.7573, "accuracy": 0.800000011920929, "learning_rate": 1.3464188612185058e-05, "epoch": 0.6526643329443796, "percentage": 65.27, "elapsed_time": "3:50:03", "remaining_time": "2:02:25", "throughput": 794.39, "total_tokens": 10965280} {"current_steps": 8400, "total_steps": 12855, "loss": 1.0475, "accuracy": 0.800000011920929, "learning_rate": 1.3410019623264085e-05, "epoch": 0.6534422403733956, "percentage": 65.34, "elapsed_time": "3:50:17", "remaining_time": "2:02:08", "throughput": 794.44, "total_tokens": 10977376} {"current_steps": 8410, "total_steps": 12855, "loss": 0.9106, "accuracy": 0.8999999761581421, "learning_rate": 1.3355919855374816e-05, "epoch": 0.6542201478024116, "percentage": 65.42, "elapsed_time": "3:50:26", "remaining_time": "2:01:47", "throughput": 794.59, "total_tokens": 10986112} {"current_steps": 8420, "total_steps": 12855, "loss": 0.8656, "accuracy": 1.0, "learning_rate": 1.3301889631627517e-05, "epoch": 0.6549980552314275, "percentage": 65.5, "elapsed_time": "3:50:43", "remaining_time": "2:01:31", "throughput": 794.71, "total_tokens": 11001168} {"current_steps": 8430, "total_steps": 12855, "loss": 0.7249, "accuracy": 0.800000011920929, "learning_rate": 1.3247929274717134e-05, "epoch": 0.6557759626604434, "percentage": 65.58, "elapsed_time": "3:50:52", "remaining_time": "2:01:11", "throughput": 794.89, "total_tokens": 11011248} {"current_steps": 8440, "total_steps": 12855, "loss": 0.8746, "accuracy": 1.0, "learning_rate": 1.3194039106921285e-05, "epoch": 0.6565538700894593, "percentage": 65.66, "elapsed_time": "3:51:12", "remaining_time": "2:00:56", "throughput": 794.97, "total_tokens": 11028512} {"current_steps": 8450, "total_steps": 12855, "loss": 0.8759, "accuracy": 0.8999999761581421, "learning_rate": 1.3140219450098418e-05, "epoch": 0.6573317775184753, "percentage": 65.73, "elapsed_time": "3:51:26", "remaining_time": "2:00:38", "throughput": 795.05, "total_tokens": 11040240} {"current_steps": 8460, "total_steps": 12855, "loss": 1.0005, "accuracy": 1.0, "learning_rate": 1.3086470625685854e-05, "epoch": 0.6581096849474912, "percentage": 65.81, "elapsed_time": "3:51:43", "remaining_time": "2:00:22", "throughput": 795.13, "total_tokens": 11054704} {"current_steps": 8470, "total_steps": 12855, "loss": 0.8206, "accuracy": 1.0, "learning_rate": 1.3032792954697862e-05, "epoch": 0.6588875923765072, "percentage": 65.89, "elapsed_time": "3:52:02", "remaining_time": "2:00:07", "throughput": 795.15, "total_tokens": 11070592} {"current_steps": 8480, "total_steps": 12855, "loss": 0.982, "accuracy": 1.0, "learning_rate": 1.2979186757723744e-05, "epoch": 0.6596654998055231, "percentage": 65.97, "elapsed_time": "3:52:13", "remaining_time": "1:59:48", "throughput": 795.26, "total_tokens": 11080528} {"current_steps": 8490, "total_steps": 12855, "loss": 0.8463, "accuracy": 1.0, "learning_rate": 1.2925652354925927e-05, "epoch": 0.6604434072345391, "percentage": 66.04, "elapsed_time": "3:52:24", "remaining_time": "1:59:29", "throughput": 795.37, "total_tokens": 11090880} {"current_steps": 8500, "total_steps": 12855, "loss": 1.0242, "accuracy": 0.800000011920929, "learning_rate": 1.2872190066038056e-05, "epoch": 0.661221314663555, "percentage": 66.12, "elapsed_time": "3:52:39", "remaining_time": "1:59:11", "throughput": 795.47, "total_tokens": 11104016} {"current_steps": 8510, "total_steps": 12855, "loss": 0.8629, "accuracy": 0.800000011920929, "learning_rate": 1.2818800210363063e-05, "epoch": 0.661999222092571, "percentage": 66.2, "elapsed_time": "3:52:54", "remaining_time": "1:58:55", "throughput": 795.56, "total_tokens": 11117712} {"current_steps": 8520, "total_steps": 12855, "loss": 0.9358, "accuracy": 1.0, "learning_rate": 1.2765483106771275e-05, "epoch": 0.662777129521587, "percentage": 66.28, "elapsed_time": "3:53:09", "remaining_time": "1:58:37", "throughput": 795.72, "total_tokens": 11131488} {"current_steps": 8530, "total_steps": 12855, "loss": 0.9689, "accuracy": 0.8999999761581421, "learning_rate": 1.271223907369853e-05, "epoch": 0.6635550369506029, "percentage": 66.36, "elapsed_time": "3:53:20", "remaining_time": "1:58:18", "throughput": 795.77, "total_tokens": 11141600} {"current_steps": 8540, "total_steps": 12855, "loss": 0.8566, "accuracy": 0.800000011920929, "learning_rate": 1.2659068429144228e-05, "epoch": 0.6643329443796189, "percentage": 66.43, "elapsed_time": "3:53:48", "remaining_time": "1:58:08", "throughput": 795.18, "total_tokens": 11155056} {"current_steps": 8550, "total_steps": 12855, "loss": 0.7653, "accuracy": 1.0, "learning_rate": 1.2605971490669471e-05, "epoch": 0.6651108518086347, "percentage": 66.51, "elapsed_time": "3:54:07", "remaining_time": "1:57:52", "throughput": 795.27, "total_tokens": 11171168} {"current_steps": 8560, "total_steps": 12855, "loss": 1.0221, "accuracy": 0.5, "learning_rate": 1.2552948575395135e-05, "epoch": 0.6658887592376507, "percentage": 66.59, "elapsed_time": "3:54:17", "remaining_time": "1:57:33", "throughput": 795.38, "total_tokens": 11181328} {"current_steps": 8570, "total_steps": 12855, "loss": 0.8437, "accuracy": 1.0, "learning_rate": 1.2500000000000006e-05, "epoch": 0.6666666666666666, "percentage": 66.67, "elapsed_time": "3:54:28", "remaining_time": "1:57:14", "throughput": 795.49, "total_tokens": 11191392} {"current_steps": 8580, "total_steps": 12855, "loss": 0.8278, "accuracy": 1.0, "learning_rate": 1.2447126080718876e-05, "epoch": 0.6674445740956826, "percentage": 66.74, "elapsed_time": "3:54:51", "remaining_time": "1:57:00", "throughput": 795.39, "total_tokens": 11207888} {"current_steps": 8590, "total_steps": 12855, "loss": 0.9001, "accuracy": 1.0, "learning_rate": 1.2394327133340658e-05, "epoch": 0.6682224815246985, "percentage": 66.82, "elapsed_time": "3:55:05", "remaining_time": "1:56:43", "throughput": 795.47, "total_tokens": 11220624} {"current_steps": 8600, "total_steps": 12855, "loss": 1.4506, "accuracy": 0.800000011920929, "learning_rate": 1.2341603473206486e-05, "epoch": 0.6690003889537145, "percentage": 66.9, "elapsed_time": "3:55:18", "remaining_time": "1:56:25", "throughput": 795.61, "total_tokens": 11232528} {"current_steps": 8610, "total_steps": 12855, "loss": 0.9102, "accuracy": 1.0, "learning_rate": 1.2288955415207848e-05, "epoch": 0.6697782963827305, "percentage": 66.98, "elapsed_time": "3:55:32", "remaining_time": "1:56:08", "throughput": 795.64, "total_tokens": 11244800} {"current_steps": 8620, "total_steps": 12855, "loss": 0.9622, "accuracy": 0.8999999761581421, "learning_rate": 1.2236383273784696e-05, "epoch": 0.6705562038117464, "percentage": 67.06, "elapsed_time": "3:55:45", "remaining_time": "1:55:49", "throughput": 795.62, "total_tokens": 11254816} {"current_steps": 8630, "total_steps": 12855, "loss": 0.9647, "accuracy": 1.0, "learning_rate": 1.2183887362923577e-05, "epoch": 0.6713341112407624, "percentage": 67.13, "elapsed_time": "3:55:55", "remaining_time": "1:55:30", "throughput": 795.78, "total_tokens": 11264864} {"current_steps": 8640, "total_steps": 12855, "loss": 0.88, "accuracy": 0.8999999761581421, "learning_rate": 1.213146799615574e-05, "epoch": 0.6721120186697783, "percentage": 67.21, "elapsed_time": "3:56:06", "remaining_time": "1:55:11", "throughput": 795.95, "total_tokens": 11275808} {"current_steps": 8650, "total_steps": 12855, "loss": 0.8771, "accuracy": 0.8999999761581421, "learning_rate": 1.2079125486555279e-05, "epoch": 0.6728899260987943, "percentage": 67.29, "elapsed_time": "3:56:20", "remaining_time": "1:54:53", "throughput": 796.12, "total_tokens": 11289264} {"current_steps": 8660, "total_steps": 12855, "loss": 0.8308, "accuracy": 1.0, "learning_rate": 1.2026860146737281e-05, "epoch": 0.6736678335278102, "percentage": 67.37, "elapsed_time": "3:56:35", "remaining_time": "1:54:36", "throughput": 796.15, "total_tokens": 11301696} {"current_steps": 8670, "total_steps": 12855, "loss": 0.9782, "accuracy": 0.8999999761581421, "learning_rate": 1.1974672288855912e-05, "epoch": 0.6744457409568262, "percentage": 67.44, "elapsed_time": "3:56:50", "remaining_time": "1:54:19", "throughput": 796.28, "total_tokens": 11315600} {"current_steps": 8680, "total_steps": 12855, "loss": 0.9351, "accuracy": 0.8999999761581421, "learning_rate": 1.192256222460259e-05, "epoch": 0.675223648385842, "percentage": 67.52, "elapsed_time": "3:57:04", "remaining_time": "1:54:01", "throughput": 796.52, "total_tokens": 11329840} {"current_steps": 8690, "total_steps": 12855, "loss": 0.9687, "accuracy": 1.0, "learning_rate": 1.1870530265204091e-05, "epoch": 0.676001555814858, "percentage": 67.6, "elapsed_time": "3:57:18", "remaining_time": "1:53:44", "throughput": 796.58, "total_tokens": 11342304} {"current_steps": 8700, "total_steps": 12855, "loss": 0.9763, "accuracy": 1.0, "learning_rate": 1.1818576721420734e-05, "epoch": 0.676779463243874, "percentage": 67.68, "elapsed_time": "3:57:56", "remaining_time": "1:53:38", "throughput": 795.75, "total_tokens": 11360608} {"current_steps": 8710, "total_steps": 12855, "loss": 0.7904, "accuracy": 0.800000011920929, "learning_rate": 1.1766701903544497e-05, "epoch": 0.6775573706728899, "percentage": 67.76, "elapsed_time": "3:58:15", "remaining_time": "1:53:22", "throughput": 795.69, "total_tokens": 11374576} {"current_steps": 8720, "total_steps": 12855, "loss": 1.1281, "accuracy": 1.0, "learning_rate": 1.1714906121397162e-05, "epoch": 0.6783352781019059, "percentage": 67.83, "elapsed_time": "3:58:35", "remaining_time": "1:53:08", "throughput": 795.74, "total_tokens": 11391488} {"current_steps": 8730, "total_steps": 12855, "loss": 0.8148, "accuracy": 1.0, "learning_rate": 1.166318968432848e-05, "epoch": 0.6791131855309218, "percentage": 67.91, "elapsed_time": "3:58:49", "remaining_time": "1:52:51", "throughput": 795.87, "total_tokens": 11404816} {"current_steps": 8740, "total_steps": 12855, "loss": 1.0578, "accuracy": 1.0, "learning_rate": 1.16115529012143e-05, "epoch": 0.6798910929599378, "percentage": 67.99, "elapsed_time": "3:59:11", "remaining_time": "1:52:36", "throughput": 795.97, "total_tokens": 11423280} {"current_steps": 8750, "total_steps": 12855, "loss": 1.0336, "accuracy": 0.8999999761581421, "learning_rate": 1.1559996080454752e-05, "epoch": 0.6806690003889537, "percentage": 68.07, "elapsed_time": "3:59:23", "remaining_time": "1:52:18", "throughput": 796.14, "total_tokens": 11435520} {"current_steps": 8760, "total_steps": 12855, "loss": 0.8583, "accuracy": 1.0, "learning_rate": 1.150851952997239e-05, "epoch": 0.6814469078179697, "percentage": 68.14, "elapsed_time": "3:59:37", "remaining_time": "1:52:01", "throughput": 796.26, "total_tokens": 11448432} {"current_steps": 8770, "total_steps": 12855, "loss": 0.8311, "accuracy": 0.8999999761581421, "learning_rate": 1.1457123557210347e-05, "epoch": 0.6822248152469856, "percentage": 68.22, "elapsed_time": "3:59:49", "remaining_time": "1:51:42", "throughput": 796.25, "total_tokens": 11457328} {"current_steps": 8780, "total_steps": 12855, "loss": 0.9736, "accuracy": 1.0, "learning_rate": 1.1405808469130504e-05, "epoch": 0.6830027226760016, "percentage": 68.3, "elapsed_time": "4:00:04", "remaining_time": "1:51:25", "throughput": 796.37, "total_tokens": 11471040} {"current_steps": 8790, "total_steps": 12855, "loss": 0.7804, "accuracy": 0.8999999761581421, "learning_rate": 1.1354574572211685e-05, "epoch": 0.6837806301050176, "percentage": 68.38, "elapsed_time": "4:00:19", "remaining_time": "1:51:08", "throughput": 796.38, "total_tokens": 11483152} {"current_steps": 8800, "total_steps": 12855, "loss": 0.7664, "accuracy": 1.0, "learning_rate": 1.1303422172447781e-05, "epoch": 0.6845585375340334, "percentage": 68.46, "elapsed_time": "4:00:30", "remaining_time": "1:50:49", "throughput": 796.55, "total_tokens": 11494192} {"current_steps": 8810, "total_steps": 12855, "loss": 0.7949, "accuracy": 1.0, "learning_rate": 1.1252351575345923e-05, "epoch": 0.6853364449630494, "percentage": 68.53, "elapsed_time": "4:00:46", "remaining_time": "1:50:32", "throughput": 796.68, "total_tokens": 11509200} {"current_steps": 8820, "total_steps": 12855, "loss": 1.0021, "accuracy": 0.8999999761581421, "learning_rate": 1.1201363085924709e-05, "epoch": 0.6861143523920653, "percentage": 68.61, "elapsed_time": "4:01:01", "remaining_time": "1:50:16", "throughput": 796.73, "total_tokens": 11522208} {"current_steps": 8830, "total_steps": 12855, "loss": 0.9748, "accuracy": 1.0, "learning_rate": 1.1150457008712337e-05, "epoch": 0.6868922598210813, "percentage": 68.69, "elapsed_time": "4:01:35", "remaining_time": "1:50:07", "throughput": 796.01, "total_tokens": 11538160} {"current_steps": 8840, "total_steps": 12855, "loss": 2.6104, "accuracy": 1.0, "learning_rate": 1.1099633647744797e-05, "epoch": 0.6876701672500972, "percentage": 68.77, "elapsed_time": "4:01:54", "remaining_time": "1:49:52", "throughput": 795.97, "total_tokens": 11552928} {"current_steps": 8850, "total_steps": 12855, "loss": 0.892, "accuracy": 1.0, "learning_rate": 1.1048893306564062e-05, "epoch": 0.6884480746791132, "percentage": 68.84, "elapsed_time": "4:02:08", "remaining_time": "1:49:34", "throughput": 796.0, "total_tokens": 11564832} {"current_steps": 8860, "total_steps": 12855, "loss": 0.8744, "accuracy": 1.0, "learning_rate": 1.0998236288216265e-05, "epoch": 0.6892259821081291, "percentage": 68.92, "elapsed_time": "4:02:26", "remaining_time": "1:49:18", "throughput": 796.05, "total_tokens": 11579696} {"current_steps": 8870, "total_steps": 12855, "loss": 0.87, "accuracy": 1.0, "learning_rate": 1.0947662895249896e-05, "epoch": 0.6900038895371451, "percentage": 69.0, "elapsed_time": "4:02:44", "remaining_time": "1:49:03", "throughput": 796.2, "total_tokens": 11596480} {"current_steps": 8880, "total_steps": 12855, "loss": 0.9965, "accuracy": 1.0, "learning_rate": 1.0897173429714e-05, "epoch": 0.690781796966161, "percentage": 69.08, "elapsed_time": "4:03:09", "remaining_time": "1:48:50", "throughput": 796.17, "total_tokens": 11615344} {"current_steps": 8890, "total_steps": 12855, "loss": 0.8733, "accuracy": 1.0, "learning_rate": 1.0846768193156357e-05, "epoch": 0.691559704395177, "percentage": 69.16, "elapsed_time": "4:03:21", "remaining_time": "1:48:32", "throughput": 796.24, "total_tokens": 11626128} {"current_steps": 8900, "total_steps": 12855, "loss": 0.8323, "accuracy": 0.8999999761581421, "learning_rate": 1.0796447486621694e-05, "epoch": 0.692337611824193, "percentage": 69.23, "elapsed_time": "4:03:30", "remaining_time": "1:48:12", "throughput": 796.4, "total_tokens": 11635776} {"current_steps": 8910, "total_steps": 12855, "loss": 0.7968, "accuracy": 1.0, "learning_rate": 1.0746211610649873e-05, "epoch": 0.6931155192532089, "percentage": 69.31, "elapsed_time": "4:03:45", "remaining_time": "1:47:55", "throughput": 796.48, "total_tokens": 11648464} {"current_steps": 8920, "total_steps": 12855, "loss": 0.8646, "accuracy": 1.0, "learning_rate": 1.0696060865274139e-05, "epoch": 0.6938934266822249, "percentage": 69.39, "elapsed_time": "4:04:06", "remaining_time": "1:47:40", "throughput": 796.34, "total_tokens": 11663152} {"current_steps": 8930, "total_steps": 12855, "loss": 0.8549, "accuracy": 1.0, "learning_rate": 1.0645995550019266e-05, "epoch": 0.6946713341112407, "percentage": 69.47, "elapsed_time": "4:04:26", "remaining_time": "1:47:26", "throughput": 796.39, "total_tokens": 11679952} {"current_steps": 8940, "total_steps": 12855, "loss": 0.8793, "accuracy": 0.8999999761581421, "learning_rate": 1.0596015963899792e-05, "epoch": 0.6954492415402567, "percentage": 69.54, "elapsed_time": "4:04:48", "remaining_time": "1:47:12", "throughput": 796.13, "total_tokens": 11694208} {"current_steps": 8950, "total_steps": 12855, "loss": 0.8759, "accuracy": 1.0, "learning_rate": 1.054612240541826e-05, "epoch": 0.6962271489692726, "percentage": 69.62, "elapsed_time": "4:05:00", "remaining_time": "1:46:53", "throughput": 796.24, "total_tokens": 11705008} {"current_steps": 8960, "total_steps": 12855, "loss": 0.9931, "accuracy": 1.0, "learning_rate": 1.0496315172563404e-05, "epoch": 0.6970050563982886, "percentage": 69.7, "elapsed_time": "4:05:15", "remaining_time": "1:46:37", "throughput": 796.2, "total_tokens": 11716576} {"current_steps": 8970, "total_steps": 12855, "loss": 0.8171, "accuracy": 0.8999999761581421, "learning_rate": 1.0446594562808382e-05, "epoch": 0.6977829638273045, "percentage": 69.78, "elapsed_time": "4:05:35", "remaining_time": "1:46:21", "throughput": 796.23, "total_tokens": 11732480} {"current_steps": 8980, "total_steps": 12855, "loss": 0.9468, "accuracy": 1.0, "learning_rate": 1.0396960873108992e-05, "epoch": 0.6985608712563205, "percentage": 69.86, "elapsed_time": "4:05:48", "remaining_time": "1:46:04", "throughput": 796.35, "total_tokens": 11744784} {"current_steps": 8990, "total_steps": 12855, "loss": 1.062, "accuracy": 1.0, "learning_rate": 1.0347414399901908e-05, "epoch": 0.6993387786853364, "percentage": 69.93, "elapsed_time": "4:06:04", "remaining_time": "1:45:47", "throughput": 796.37, "total_tokens": 11757712} {"current_steps": 9000, "total_steps": 12855, "loss": 0.999, "accuracy": 1.0, "learning_rate": 1.0297955439102899e-05, "epoch": 0.7001166861143524, "percentage": 70.01, "elapsed_time": "4:06:13", "remaining_time": "1:45:27", "throughput": 796.56, "total_tokens": 11767792} {"current_steps": 9010, "total_steps": 12855, "loss": 0.7289, "accuracy": 1.0, "learning_rate": 1.0248584286105077e-05, "epoch": 0.7008945935433684, "percentage": 70.09, "elapsed_time": "4:06:30", "remaining_time": "1:45:11", "throughput": 796.36, "total_tokens": 11778512} {"current_steps": 9020, "total_steps": 12855, "loss": 1.0792, "accuracy": 0.800000011920929, "learning_rate": 1.0199301235777106e-05, "epoch": 0.7016725009723843, "percentage": 70.17, "elapsed_time": "4:06:52", "remaining_time": "1:44:57", "throughput": 796.31, "total_tokens": 11794976} {"current_steps": 9030, "total_steps": 12855, "loss": 0.7016, "accuracy": 1.0, "learning_rate": 1.0150106582461477e-05, "epoch": 0.7024504084014003, "percentage": 70.25, "elapsed_time": "4:07:04", "remaining_time": "1:44:39", "throughput": 796.4, "total_tokens": 11806400} {"current_steps": 9040, "total_steps": 12855, "loss": 0.8557, "accuracy": 0.8999999761581421, "learning_rate": 1.0101000619972708e-05, "epoch": 0.7032283158304162, "percentage": 70.32, "elapsed_time": "4:07:18", "remaining_time": "1:44:22", "throughput": 796.51, "total_tokens": 11818976} {"current_steps": 9050, "total_steps": 12855, "loss": 0.8437, "accuracy": 1.0, "learning_rate": 1.0051983641595658e-05, "epoch": 0.7040062232594321, "percentage": 70.4, "elapsed_time": "4:07:30", "remaining_time": "1:44:03", "throughput": 796.64, "total_tokens": 11830848} {"current_steps": 9060, "total_steps": 12855, "loss": 0.7572, "accuracy": 1.0, "learning_rate": 1.0003055940083661e-05, "epoch": 0.704784130688448, "percentage": 70.48, "elapsed_time": "4:07:40", "remaining_time": "1:43:44", "throughput": 796.77, "total_tokens": 11840480} {"current_steps": 9070, "total_steps": 12855, "loss": 3.6154, "accuracy": 1.0, "learning_rate": 9.954217807656898e-06, "epoch": 0.705562038117464, "percentage": 70.56, "elapsed_time": "4:07:52", "remaining_time": "1:43:26", "throughput": 796.82, "total_tokens": 11851088} {"current_steps": 9080, "total_steps": 12855, "loss": 0.8814, "accuracy": 0.8999999761581421, "learning_rate": 9.905469536000583e-06, "epoch": 0.7063399455464799, "percentage": 70.63, "elapsed_time": "4:08:05", "remaining_time": "1:43:08", "throughput": 796.89, "total_tokens": 11862384} {"current_steps": 9090, "total_steps": 12855, "loss": 0.678, "accuracy": 1.0, "learning_rate": 9.856811416263234e-06, "epoch": 0.7071178529754959, "percentage": 70.71, "elapsed_time": "4:08:21", "remaining_time": "1:42:51", "throughput": 797.01, "total_tokens": 11876304} {"current_steps": 9100, "total_steps": 12855, "loss": 1.0452, "accuracy": 1.0, "learning_rate": 9.808243739054945e-06, "epoch": 0.7078957604045119, "percentage": 70.79, "elapsed_time": "4:08:35", "remaining_time": "1:42:34", "throughput": 797.14, "total_tokens": 11889872} {"current_steps": 9110, "total_steps": 12855, "loss": 0.9186, "accuracy": 0.8999999761581421, "learning_rate": 9.75976679444564e-06, "epoch": 0.7086736678335278, "percentage": 70.87, "elapsed_time": "4:08:44", "remaining_time": "1:42:15", "throughput": 797.24, "total_tokens": 11898656} {"current_steps": 9120, "total_steps": 12855, "loss": 0.6738, "accuracy": 1.0, "learning_rate": 9.711380871963343e-06, "epoch": 0.7094515752625438, "percentage": 70.95, "elapsed_time": "4:09:04", "remaining_time": "1:42:00", "throughput": 797.09, "total_tokens": 11912496} {"current_steps": 9130, "total_steps": 12855, "loss": 0.7861, "accuracy": 1.0, "learning_rate": 9.663086260592447e-06, "epoch": 0.7102294826915597, "percentage": 71.02, "elapsed_time": "4:09:18", "remaining_time": "1:41:42", "throughput": 797.26, "total_tokens": 11925536} {"current_steps": 9140, "total_steps": 12855, "loss": 0.9792, "accuracy": 0.8999999761581421, "learning_rate": 9.614883248771996e-06, "epoch": 0.7110073901205757, "percentage": 71.1, "elapsed_time": "4:09:32", "remaining_time": "1:41:25", "throughput": 797.38, "total_tokens": 11938576} {"current_steps": 9150, "total_steps": 12855, "loss": 1.193, "accuracy": 0.8999999761581421, "learning_rate": 9.566772124393952e-06, "epoch": 0.7117852975495916, "percentage": 71.18, "elapsed_time": "4:09:45", "remaining_time": "1:41:07", "throughput": 797.58, "total_tokens": 11952224} {"current_steps": 9160, "total_steps": 12855, "loss": 0.9171, "accuracy": 0.800000011920929, "learning_rate": 9.518753174801484e-06, "epoch": 0.7125632049786076, "percentage": 71.26, "elapsed_time": "4:10:05", "remaining_time": "1:40:53", "throughput": 797.52, "total_tokens": 11967408} {"current_steps": 9170, "total_steps": 12855, "loss": 1.0997, "accuracy": 0.800000011920929, "learning_rate": 9.470826686787235e-06, "epoch": 0.7133411124076235, "percentage": 71.33, "elapsed_time": "4:10:20", "remaining_time": "1:40:36", "throughput": 797.62, "total_tokens": 11980944} {"current_steps": 9180, "total_steps": 12855, "loss": 0.9447, "accuracy": 1.0, "learning_rate": 9.42299294659166e-06, "epoch": 0.7141190198366394, "percentage": 71.41, "elapsed_time": "4:10:33", "remaining_time": "1:40:18", "throughput": 797.7, "total_tokens": 11992208} {"current_steps": 9190, "total_steps": 12855, "loss": 0.9496, "accuracy": 1.0, "learning_rate": 9.375252239901225e-06, "epoch": 0.7148969272656553, "percentage": 71.49, "elapsed_time": "4:10:44", "remaining_time": "1:39:59", "throughput": 797.85, "total_tokens": 12003008} {"current_steps": 9200, "total_steps": 12855, "loss": 0.7286, "accuracy": 1.0, "learning_rate": 9.327604851846791e-06, "epoch": 0.7156748346946713, "percentage": 71.57, "elapsed_time": "4:10:59", "remaining_time": "1:39:42", "throughput": 797.94, "total_tokens": 12016240} {"current_steps": 9210, "total_steps": 12855, "loss": 0.8197, "accuracy": 1.0, "learning_rate": 9.280051067001865e-06, "epoch": 0.7164527421236873, "percentage": 71.65, "elapsed_time": "4:11:08", "remaining_time": "1:39:23", "throughput": 798.15, "total_tokens": 12026816} {"current_steps": 9220, "total_steps": 12855, "loss": 0.9061, "accuracy": 1.0, "learning_rate": 9.232591169380912e-06, "epoch": 0.7172306495527032, "percentage": 71.72, "elapsed_time": "4:11:25", "remaining_time": "1:39:07", "throughput": 798.16, "total_tokens": 12040848} {"current_steps": 9230, "total_steps": 12855, "loss": 0.8145, "accuracy": 1.0, "learning_rate": 9.185225442437648e-06, "epoch": 0.7180085569817192, "percentage": 71.8, "elapsed_time": "4:11:39", "remaining_time": "1:38:50", "throughput": 798.2, "total_tokens": 12052192} {"current_steps": 9240, "total_steps": 12855, "loss": 0.7312, "accuracy": 1.0, "learning_rate": 9.137954169063365e-06, "epoch": 0.7187864644107351, "percentage": 71.88, "elapsed_time": "4:11:57", "remaining_time": "1:38:34", "throughput": 798.22, "total_tokens": 12067040} {"current_steps": 9250, "total_steps": 12855, "loss": 0.8557, "accuracy": 0.8999999761581421, "learning_rate": 9.09077763158523e-06, "epoch": 0.7195643718397511, "percentage": 71.96, "elapsed_time": "4:12:16", "remaining_time": "1:38:19", "throughput": 798.26, "total_tokens": 12083264} {"current_steps": 9260, "total_steps": 12855, "loss": 0.8535, "accuracy": 0.8999999761581421, "learning_rate": 9.043696111764598e-06, "epoch": 0.720342279268767, "percentage": 72.03, "elapsed_time": "4:12:49", "remaining_time": "1:38:09", "throughput": 797.71, "total_tokens": 12100672} {"current_steps": 9270, "total_steps": 12855, "loss": 0.9404, "accuracy": 1.0, "learning_rate": 8.996709890795338e-06, "epoch": 0.721120186697783, "percentage": 72.11, "elapsed_time": "4:12:59", "remaining_time": "1:37:50", "throughput": 797.88, "total_tokens": 12111344} {"current_steps": 9280, "total_steps": 12855, "loss": 0.9023, "accuracy": 1.0, "learning_rate": 8.949819249302138e-06, "epoch": 0.721898094126799, "percentage": 72.19, "elapsed_time": "4:13:15", "remaining_time": "1:37:34", "throughput": 798.04, "total_tokens": 12126928} {"current_steps": 9290, "total_steps": 12855, "loss": 1.2405, "accuracy": 1.0, "learning_rate": 8.903024467338846e-06, "epoch": 0.7226760015558149, "percentage": 72.27, "elapsed_time": "4:13:29", "remaining_time": "1:37:16", "throughput": 798.08, "total_tokens": 12138704} {"current_steps": 9300, "total_steps": 12855, "loss": 0.9524, "accuracy": 1.0, "learning_rate": 8.856325824386792e-06, "epoch": 0.7234539089848308, "percentage": 72.35, "elapsed_time": "4:13:40", "remaining_time": "1:36:58", "throughput": 798.14, "total_tokens": 12147984} {"current_steps": 9310, "total_steps": 12855, "loss": 0.9529, "accuracy": 0.8999999761581421, "learning_rate": 8.809723599353106e-06, "epoch": 0.7242318164138467, "percentage": 72.42, "elapsed_time": "4:13:56", "remaining_time": "1:36:41", "throughput": 798.17, "total_tokens": 12161680} {"current_steps": 9320, "total_steps": 12855, "loss": 0.9382, "accuracy": 1.0, "learning_rate": 8.763218070569073e-06, "epoch": 0.7250097238428627, "percentage": 72.5, "elapsed_time": "4:14:11", "remaining_time": "1:36:24", "throughput": 798.24, "total_tokens": 12174112} {"current_steps": 9330, "total_steps": 12855, "loss": 0.9378, "accuracy": 1.0, "learning_rate": 8.71680951578846e-06, "epoch": 0.7257876312718786, "percentage": 72.58, "elapsed_time": "4:14:28", "remaining_time": "1:36:08", "throughput": 798.28, "total_tokens": 12188144} {"current_steps": 9340, "total_steps": 12855, "loss": 0.8719, "accuracy": 0.800000011920929, "learning_rate": 8.670498212185854e-06, "epoch": 0.7265655387008946, "percentage": 72.66, "elapsed_time": "4:14:44", "remaining_time": "1:35:52", "throughput": 798.34, "total_tokens": 12202320} {"current_steps": 9350, "total_steps": 12855, "loss": 0.8026, "accuracy": 1.0, "learning_rate": 8.624284436355012e-06, "epoch": 0.7273434461299105, "percentage": 72.73, "elapsed_time": "4:15:06", "remaining_time": "1:35:37", "throughput": 798.26, "total_tokens": 12218336} {"current_steps": 9360, "total_steps": 12855, "loss": 0.6062, "accuracy": 1.0, "learning_rate": 8.578168464307206e-06, "epoch": 0.7281213535589265, "percentage": 72.81, "elapsed_time": "4:15:21", "remaining_time": "1:35:21", "throughput": 798.26, "total_tokens": 12230592} {"current_steps": 9370, "total_steps": 12855, "loss": 1.3069, "accuracy": 0.8999999761581421, "learning_rate": 8.53215057146958e-06, "epoch": 0.7288992609879424, "percentage": 72.89, "elapsed_time": "4:15:35", "remaining_time": "1:35:03", "throughput": 798.3, "total_tokens": 12242032} {"current_steps": 9380, "total_steps": 12855, "loss": 0.9206, "accuracy": 1.0, "learning_rate": 8.486231032683498e-06, "epoch": 0.7296771684169584, "percentage": 72.97, "elapsed_time": "4:16:01", "remaining_time": "1:34:51", "throughput": 798.08, "total_tokens": 12259872} {"current_steps": 9390, "total_steps": 12855, "loss": 0.9393, "accuracy": 0.800000011920929, "learning_rate": 8.440410122202902e-06, "epoch": 0.7304550758459744, "percentage": 73.05, "elapsed_time": "4:16:19", "remaining_time": "1:34:35", "throughput": 798.11, "total_tokens": 12274096} {"current_steps": 9400, "total_steps": 12855, "loss": 0.9588, "accuracy": 1.0, "learning_rate": 8.394688113692684e-06, "epoch": 0.7312329832749903, "percentage": 73.12, "elapsed_time": "4:16:35", "remaining_time": "1:34:18", "throughput": 798.17, "total_tokens": 12288448} {"current_steps": 9410, "total_steps": 12855, "loss": 0.9409, "accuracy": 0.8999999761581421, "learning_rate": 8.349065280227043e-06, "epoch": 0.7320108907040063, "percentage": 73.2, "elapsed_time": "4:16:49", "remaining_time": "1:34:01", "throughput": 798.25, "total_tokens": 12300544} {"current_steps": 9420, "total_steps": 12855, "loss": 0.9839, "accuracy": 1.0, "learning_rate": 8.303541894287853e-06, "epoch": 0.7327887981330222, "percentage": 73.28, "elapsed_time": "4:17:00", "remaining_time": "1:33:43", "throughput": 798.31, "total_tokens": 12310352} {"current_steps": 9430, "total_steps": 12855, "loss": 0.9301, "accuracy": 0.8999999761581421, "learning_rate": 8.258118227763042e-06, "epoch": 0.7335667055620381, "percentage": 73.36, "elapsed_time": "4:17:20", "remaining_time": "1:33:27", "throughput": 798.25, "total_tokens": 12325184} {"current_steps": 9440, "total_steps": 12855, "loss": 1.3908, "accuracy": 0.8999999761581421, "learning_rate": 8.212794551944968e-06, "epoch": 0.734344612991054, "percentage": 73.43, "elapsed_time": "4:17:34", "remaining_time": "1:33:10", "throughput": 798.4, "total_tokens": 12338624} {"current_steps": 9450, "total_steps": 12855, "loss": 0.7493, "accuracy": 0.8999999761581421, "learning_rate": 8.167571137528788e-06, "epoch": 0.73512252042007, "percentage": 73.51, "elapsed_time": "4:17:48", "remaining_time": "1:32:53", "throughput": 798.53, "total_tokens": 12351760} {"current_steps": 9460, "total_steps": 12855, "loss": 0.7375, "accuracy": 0.800000011920929, "learning_rate": 8.122448254610853e-06, "epoch": 0.7359004278490859, "percentage": 73.59, "elapsed_time": "4:18:04", "remaining_time": "1:32:36", "throughput": 798.58, "total_tokens": 12365376} {"current_steps": 9470, "total_steps": 12855, "loss": 0.935, "accuracy": 0.8999999761581421, "learning_rate": 8.077426172687092e-06, "epoch": 0.7366783352781019, "percentage": 73.67, "elapsed_time": "4:18:24", "remaining_time": "1:32:22", "throughput": 798.6, "total_tokens": 12382208} {"current_steps": 9480, "total_steps": 12855, "loss": 0.9444, "accuracy": 1.0, "learning_rate": 8.032505160651393e-06, "epoch": 0.7374562427071178, "percentage": 73.75, "elapsed_time": "4:18:36", "remaining_time": "1:32:04", "throughput": 798.8, "total_tokens": 12394752} {"current_steps": 9490, "total_steps": 12855, "loss": 0.7709, "accuracy": 1.0, "learning_rate": 7.987685486794021e-06, "epoch": 0.7382341501361338, "percentage": 73.82, "elapsed_time": "4:18:53", "remaining_time": "1:31:47", "throughput": 798.86, "total_tokens": 12408784} {"current_steps": 9500, "total_steps": 12855, "loss": 0.8703, "accuracy": 0.800000011920929, "learning_rate": 7.942967418799987e-06, "epoch": 0.7390120575651498, "percentage": 73.9, "elapsed_time": "4:19:06", "remaining_time": "1:31:30", "throughput": 798.96, "total_tokens": 12420784} {"current_steps": 9510, "total_steps": 12855, "loss": 0.8267, "accuracy": 1.0, "learning_rate": 7.898351223747463e-06, "epoch": 0.7397899649941657, "percentage": 73.98, "elapsed_time": "4:19:27", "remaining_time": "1:31:15", "throughput": 798.96, "total_tokens": 12437792} {"current_steps": 9520, "total_steps": 12855, "loss": 0.8718, "accuracy": 1.0, "learning_rate": 7.85383716810619e-06, "epoch": 0.7405678724231817, "percentage": 74.06, "elapsed_time": "4:19:41", "remaining_time": "1:30:58", "throughput": 799.03, "total_tokens": 12450464} {"current_steps": 9530, "total_steps": 12855, "loss": 0.8038, "accuracy": 0.800000011920929, "learning_rate": 7.809425517735882e-06, "epoch": 0.7413457798521976, "percentage": 74.13, "elapsed_time": "4:19:51", "remaining_time": "1:30:39", "throughput": 799.23, "total_tokens": 12460944} {"current_steps": 9540, "total_steps": 12855, "loss": 0.7145, "accuracy": 1.0, "learning_rate": 7.765116537884638e-06, "epoch": 0.7421236872812136, "percentage": 74.21, "elapsed_time": "4:20:08", "remaining_time": "1:30:23", "throughput": 799.32, "total_tokens": 12476384} {"current_steps": 9550, "total_steps": 12855, "loss": 0.9005, "accuracy": 1.0, "learning_rate": 7.720910493187353e-06, "epoch": 0.7429015947102294, "percentage": 74.29, "elapsed_time": "4:20:29", "remaining_time": "1:30:08", "throughput": 799.24, "total_tokens": 12491440} {"current_steps": 9560, "total_steps": 12855, "loss": 0.9569, "accuracy": 1.0, "learning_rate": 7.676807647664156e-06, "epoch": 0.7436795021392454, "percentage": 74.37, "elapsed_time": "4:20:35", "remaining_time": "1:29:49", "throughput": 799.4, "total_tokens": 12499264} {"current_steps": 9570, "total_steps": 12855, "loss": 0.9894, "accuracy": 0.8999999761581421, "learning_rate": 7.632808264718805e-06, "epoch": 0.7444574095682613, "percentage": 74.45, "elapsed_time": "4:20:53", "remaining_time": "1:29:33", "throughput": 799.43, "total_tokens": 12513984} {"current_steps": 9580, "total_steps": 12855, "loss": 0.9099, "accuracy": 0.8999999761581421, "learning_rate": 7.588912607137141e-06, "epoch": 0.7452353169972773, "percentage": 74.52, "elapsed_time": "4:21:10", "remaining_time": "1:29:17", "throughput": 799.44, "total_tokens": 12527952} {"current_steps": 9590, "total_steps": 12855, "loss": 0.8742, "accuracy": 0.800000011920929, "learning_rate": 7.545120937085498e-06, "epoch": 0.7460132244262933, "percentage": 74.6, "elapsed_time": "4:21:27", "remaining_time": "1:29:00", "throughput": 799.53, "total_tokens": 12542816} {"current_steps": 9600, "total_steps": 12855, "loss": 1.2204, "accuracy": 1.0, "learning_rate": 7.501433516109152e-06, "epoch": 0.7467911318553092, "percentage": 74.68, "elapsed_time": "4:21:48", "remaining_time": "1:28:46", "throughput": 799.44, "total_tokens": 12557728} {"current_steps": 9610, "total_steps": 12855, "loss": 0.7602, "accuracy": 1.0, "learning_rate": 7.457850605130745e-06, "epoch": 0.7475690392843252, "percentage": 74.76, "elapsed_time": "4:22:04", "remaining_time": "1:28:29", "throughput": 799.51, "total_tokens": 12571680} {"current_steps": 9620, "total_steps": 12855, "loss": 0.9254, "accuracy": 1.0, "learning_rate": 7.414372464448743e-06, "epoch": 0.7483469467133411, "percentage": 74.83, "elapsed_time": "4:22:14", "remaining_time": "1:28:11", "throughput": 799.57, "total_tokens": 12580880} {"current_steps": 9630, "total_steps": 12855, "loss": 0.8365, "accuracy": 0.8999999761581421, "learning_rate": 7.370999353735869e-06, "epoch": 0.7491248541423571, "percentage": 74.91, "elapsed_time": "4:22:25", "remaining_time": "1:27:53", "throughput": 799.67, "total_tokens": 12591248} {"current_steps": 9640, "total_steps": 12855, "loss": 1.148, "accuracy": 0.8999999761581421, "learning_rate": 7.327731532037549e-06, "epoch": 0.749902761571373, "percentage": 74.99, "elapsed_time": "4:22:47", "remaining_time": "1:27:38", "throughput": 799.49, "total_tokens": 12606272} {"current_steps": 9650, "total_steps": 12855, "loss": 1.0127, "accuracy": 1.0, "learning_rate": 7.284569257770382e-06, "epoch": 0.750680669000389, "percentage": 75.07, "elapsed_time": "4:23:07", "remaining_time": "1:27:23", "throughput": 799.41, "total_tokens": 12620336} {"current_steps": 9660, "total_steps": 12855, "loss": 0.8315, "accuracy": 0.8999999761581421, "learning_rate": 7.241512788720578e-06, "epoch": 0.751458576429405, "percentage": 75.15, "elapsed_time": "4:23:17", "remaining_time": "1:27:05", "throughput": 799.53, "total_tokens": 12630912} {"current_steps": 9670, "total_steps": 12855, "loss": 0.9609, "accuracy": 0.8999999761581421, "learning_rate": 7.198562382042434e-06, "epoch": 0.7522364838584209, "percentage": 75.22, "elapsed_time": "4:23:35", "remaining_time": "1:26:49", "throughput": 799.51, "total_tokens": 12644560} {"current_steps": 9680, "total_steps": 12855, "loss": 1.0293, "accuracy": 1.0, "learning_rate": 7.155718294256783e-06, "epoch": 0.7530143912874367, "percentage": 75.3, "elapsed_time": "4:23:56", "remaining_time": "1:26:34", "throughput": 799.4, "total_tokens": 12659456} {"current_steps": 9690, "total_steps": 12855, "loss": 1.0017, "accuracy": 0.8999999761581421, "learning_rate": 7.112980781249478e-06, "epoch": 0.7537922987164527, "percentage": 75.38, "elapsed_time": "4:24:09", "remaining_time": "1:26:16", "throughput": 799.41, "total_tokens": 12670160} {"current_steps": 9700, "total_steps": 12855, "loss": 0.8097, "accuracy": 1.0, "learning_rate": 7.070350098269845e-06, "epoch": 0.7545702061454687, "percentage": 75.46, "elapsed_time": "4:24:18", "remaining_time": "1:25:58", "throughput": 799.59, "total_tokens": 12680560} {"current_steps": 9710, "total_steps": 12855, "loss": 0.9539, "accuracy": 0.8999999761581421, "learning_rate": 7.027826499929177e-06, "epoch": 0.7553481135744846, "percentage": 75.53, "elapsed_time": "4:24:36", "remaining_time": "1:25:42", "throughput": 799.59, "total_tokens": 12694608} {"current_steps": 9720, "total_steps": 12855, "loss": 0.8352, "accuracy": 0.8999999761581421, "learning_rate": 6.985410240199203e-06, "epoch": 0.7561260210035006, "percentage": 75.61, "elapsed_time": "4:24:47", "remaining_time": "1:25:24", "throughput": 799.63, "total_tokens": 12704256} {"current_steps": 9730, "total_steps": 12855, "loss": 0.7932, "accuracy": 1.0, "learning_rate": 6.943101572410571e-06, "epoch": 0.7569039284325165, "percentage": 75.69, "elapsed_time": "4:24:57", "remaining_time": "1:25:05", "throughput": 799.72, "total_tokens": 12713744} {"current_steps": 9740, "total_steps": 12855, "loss": 0.7615, "accuracy": 1.0, "learning_rate": 6.900900749251338e-06, "epoch": 0.7576818358615325, "percentage": 75.77, "elapsed_time": "4:25:13", "remaining_time": "1:24:49", "throughput": 799.77, "total_tokens": 12727072} {"current_steps": 9750, "total_steps": 12855, "loss": 0.8872, "accuracy": 0.8999999761581421, "learning_rate": 6.858808022765467e-06, "epoch": 0.7584597432905484, "percentage": 75.85, "elapsed_time": "4:25:27", "remaining_time": "1:24:32", "throughput": 799.73, "total_tokens": 12737776} {"current_steps": 9760, "total_steps": 12855, "loss": 0.7448, "accuracy": 0.800000011920929, "learning_rate": 6.816823644351303e-06, "epoch": 0.7592376507195644, "percentage": 75.92, "elapsed_time": "4:25:40", "remaining_time": "1:24:14", "throughput": 799.81, "total_tokens": 12749344} {"current_steps": 9770, "total_steps": 12855, "loss": 1.1028, "accuracy": 0.8999999761581421, "learning_rate": 6.774947864760089e-06, "epoch": 0.7600155581485804, "percentage": 76.0, "elapsed_time": "4:25:51", "remaining_time": "1:23:56", "throughput": 799.94, "total_tokens": 12760368} {"current_steps": 9780, "total_steps": 12855, "loss": 0.9616, "accuracy": 1.0, "learning_rate": 6.733180934094466e-06, "epoch": 0.7607934655775963, "percentage": 76.08, "elapsed_time": "4:26:12", "remaining_time": "1:23:41", "throughput": 799.87, "total_tokens": 12775856} {"current_steps": 9790, "total_steps": 12855, "loss": 0.9124, "accuracy": 1.0, "learning_rate": 6.691523101806976e-06, "epoch": 0.7615713730066123, "percentage": 76.16, "elapsed_time": "4:26:28", "remaining_time": "1:23:25", "throughput": 800.01, "total_tokens": 12790816} {"current_steps": 9800, "total_steps": 12855, "loss": 1.0583, "accuracy": 0.8999999761581421, "learning_rate": 6.649974616698562e-06, "epoch": 0.7623492804356281, "percentage": 76.23, "elapsed_time": "4:26:41", "remaining_time": "1:23:08", "throughput": 800.08, "total_tokens": 12802160} {"current_steps": 9810, "total_steps": 12855, "loss": 0.7005, "accuracy": 0.8999999761581421, "learning_rate": 6.6085357269171035e-06, "epoch": 0.7631271878646441, "percentage": 76.31, "elapsed_time": "4:26:56", "remaining_time": "1:22:51", "throughput": 800.12, "total_tokens": 12814800} {"current_steps": 9820, "total_steps": 12855, "loss": 0.8859, "accuracy": 0.800000011920929, "learning_rate": 6.567206679955917e-06, "epoch": 0.76390509529366, "percentage": 76.39, "elapsed_time": "4:27:12", "remaining_time": "1:22:35", "throughput": 800.11, "total_tokens": 12827936} {"current_steps": 9830, "total_steps": 12855, "loss": 0.8864, "accuracy": 0.8999999761581421, "learning_rate": 6.525987722652286e-06, "epoch": 0.764683002722676, "percentage": 76.47, "elapsed_time": "4:27:29", "remaining_time": "1:22:19", "throughput": 800.16, "total_tokens": 12842480} {"current_steps": 9840, "total_steps": 12855, "loss": 0.8887, "accuracy": 1.0, "learning_rate": 6.484879101185986e-06, "epoch": 0.7654609101516919, "percentage": 76.55, "elapsed_time": "4:27:47", "remaining_time": "1:22:03", "throughput": 800.2, "total_tokens": 12857024} {"current_steps": 9850, "total_steps": 12855, "loss": 1.0873, "accuracy": 1.0, "learning_rate": 6.443881061077814e-06, "epoch": 0.7662388175807079, "percentage": 76.62, "elapsed_time": "4:28:04", "remaining_time": "1:21:46", "throughput": 800.2, "total_tokens": 12870720} {"current_steps": 9860, "total_steps": 12855, "loss": 0.8442, "accuracy": 1.0, "learning_rate": 6.402993847188113e-06, "epoch": 0.7670167250097238, "percentage": 76.7, "elapsed_time": "4:28:33", "remaining_time": "1:21:34", "throughput": 799.71, "total_tokens": 12886128} {"current_steps": 9870, "total_steps": 12855, "loss": 0.9606, "accuracy": 0.8999999761581421, "learning_rate": 6.3622177037153255e-06, "epoch": 0.7677946324387398, "percentage": 76.78, "elapsed_time": "4:28:57", "remaining_time": "1:21:20", "throughput": 799.51, "total_tokens": 12902208} {"current_steps": 9880, "total_steps": 12855, "loss": 0.8937, "accuracy": 0.8999999761581421, "learning_rate": 6.3215528741945225e-06, "epoch": 0.7685725398677558, "percentage": 76.86, "elapsed_time": "4:29:12", "remaining_time": "1:21:03", "throughput": 799.61, "total_tokens": 12915488} {"current_steps": 9890, "total_steps": 12855, "loss": 0.8059, "accuracy": 1.0, "learning_rate": 6.28099960149596e-06, "epoch": 0.7693504472967717, "percentage": 76.94, "elapsed_time": "4:29:28", "remaining_time": "1:20:47", "throughput": 799.7, "total_tokens": 12929568} {"current_steps": 9900, "total_steps": 12855, "loss": 0.9787, "accuracy": 1.0, "learning_rate": 6.2405581278236145e-06, "epoch": 0.7701283547257877, "percentage": 77.01, "elapsed_time": "4:29:40", "remaining_time": "1:20:29", "throughput": 799.77, "total_tokens": 12940400} {"current_steps": 9910, "total_steps": 12855, "loss": 0.8973, "accuracy": 1.0, "learning_rate": 6.200228694713753e-06, "epoch": 0.7709062621548036, "percentage": 77.09, "elapsed_time": "4:29:57", "remaining_time": "1:20:13", "throughput": 799.83, "total_tokens": 12955424} {"current_steps": 9920, "total_steps": 12855, "loss": 1.1717, "accuracy": 0.6000000238418579, "learning_rate": 6.160011543033467e-06, "epoch": 0.7716841695838196, "percentage": 77.17, "elapsed_time": "4:30:09", "remaining_time": "1:19:55", "throughput": 799.86, "total_tokens": 12965680} {"current_steps": 9930, "total_steps": 12855, "loss": 0.7974, "accuracy": 1.0, "learning_rate": 6.119906912979264e-06, "epoch": 0.7724620770128354, "percentage": 77.25, "elapsed_time": "4:30:20", "remaining_time": "1:19:37", "throughput": 800.05, "total_tokens": 12976944} {"current_steps": 9940, "total_steps": 12855, "loss": 0.8444, "accuracy": 1.0, "learning_rate": 6.0799150440756095e-06, "epoch": 0.7732399844418514, "percentage": 77.32, "elapsed_time": "4:30:41", "remaining_time": "1:19:22", "throughput": 799.96, "total_tokens": 12992592} {"current_steps": 9950, "total_steps": 12855, "loss": 0.8763, "accuracy": 1.0, "learning_rate": 6.040036175173505e-06, "epoch": 0.7740178918708673, "percentage": 77.4, "elapsed_time": "4:30:59", "remaining_time": "1:19:07", "throughput": 800.0, "total_tokens": 13007312} {"current_steps": 9960, "total_steps": 12855, "loss": 0.7542, "accuracy": 1.0, "learning_rate": 6.00027054444906e-06, "epoch": 0.7747957992998833, "percentage": 77.48, "elapsed_time": "4:31:14", "remaining_time": "1:18:50", "throughput": 800.09, "total_tokens": 13020864} {"current_steps": 9970, "total_steps": 12855, "loss": 1.231, "accuracy": 1.0, "learning_rate": 5.960618389402075e-06, "epoch": 0.7755737067288992, "percentage": 77.56, "elapsed_time": "4:31:34", "remaining_time": "1:18:34", "throughput": 799.98, "total_tokens": 13034928} {"current_steps": 9980, "total_steps": 12855, "loss": 0.857, "accuracy": 0.8999999761581421, "learning_rate": 5.92107994685461e-06, "epoch": 0.7763516141579152, "percentage": 77.64, "elapsed_time": "4:31:47", "remaining_time": "1:18:17", "throughput": 800.03, "total_tokens": 13046672} {"current_steps": 9990, "total_steps": 12855, "loss": 0.9055, "accuracy": 1.0, "learning_rate": 5.881655452949583e-06, "epoch": 0.7771295215869312, "percentage": 77.71, "elapsed_time": "4:31:56", "remaining_time": "1:17:59", "throughput": 800.2, "total_tokens": 13056912} {"current_steps": 10000, "total_steps": 12855, "loss": 1.1474, "accuracy": 0.8999999761581421, "learning_rate": 5.842345143149361e-06, "epoch": 0.7779074290159471, "percentage": 77.79, "elapsed_time": "4:32:07", "remaining_time": "1:17:41", "throughput": 800.35, "total_tokens": 13068000} {"current_steps": 10010, "total_steps": 12855, "loss": 1.132, "accuracy": 1.0, "learning_rate": 5.803149252234336e-06, "epoch": 0.7786853364449631, "percentage": 77.87, "elapsed_time": "4:32:32", "remaining_time": "1:17:27", "throughput": 800.07, "total_tokens": 13083008} {"current_steps": 10020, "total_steps": 12855, "loss": 0.7628, "accuracy": 0.8999999761581421, "learning_rate": 5.764068014301538e-06, "epoch": 0.779463243873979, "percentage": 77.95, "elapsed_time": "4:32:41", "remaining_time": "1:17:09", "throughput": 800.09, "total_tokens": 13090528} {"current_steps": 10030, "total_steps": 12855, "loss": 0.8512, "accuracy": 1.0, "learning_rate": 5.7251016627632435e-06, "epoch": 0.780241151302995, "percentage": 78.02, "elapsed_time": "4:33:01", "remaining_time": "1:16:53", "throughput": 800.06, "total_tokens": 13106288} {"current_steps": 10040, "total_steps": 12855, "loss": 0.8928, "accuracy": 0.8999999761581421, "learning_rate": 5.686250430345555e-06, "epoch": 0.7810190587320109, "percentage": 78.1, "elapsed_time": "4:33:20", "remaining_time": "1:16:38", "throughput": 799.96, "total_tokens": 13119776} {"current_steps": 10050, "total_steps": 12855, "loss": 1.0266, "accuracy": 1.0, "learning_rate": 5.647514549087046e-06, "epoch": 0.7817969661610268, "percentage": 78.18, "elapsed_time": "4:33:36", "remaining_time": "1:16:22", "throughput": 799.95, "total_tokens": 13132656} {"current_steps": 10060, "total_steps": 12855, "loss": 0.8212, "accuracy": 1.0, "learning_rate": 5.6088942503373265e-06, "epoch": 0.7825748735900427, "percentage": 78.26, "elapsed_time": "4:33:58", "remaining_time": "1:16:07", "throughput": 799.88, "total_tokens": 13148624} {"current_steps": 10070, "total_steps": 12855, "loss": 0.8577, "accuracy": 1.0, "learning_rate": 5.570389764755729e-06, "epoch": 0.7833527810190587, "percentage": 78.34, "elapsed_time": "4:34:29", "remaining_time": "1:15:54", "throughput": 799.57, "total_tokens": 13168432} {"current_steps": 10080, "total_steps": 12855, "loss": 0.6158, "accuracy": 1.0, "learning_rate": 5.5320013223098684e-06, "epoch": 0.7841306884480747, "percentage": 78.41, "elapsed_time": "4:34:42", "remaining_time": "1:15:37", "throughput": 799.64, "total_tokens": 13179840} {"current_steps": 10090, "total_steps": 12855, "loss": 1.1557, "accuracy": 0.8999999761581421, "learning_rate": 5.493729152274302e-06, "epoch": 0.7849085958770906, "percentage": 78.49, "elapsed_time": "4:35:12", "remaining_time": "1:15:25", "throughput": 799.41, "total_tokens": 13200592} {"current_steps": 10100, "total_steps": 12855, "loss": 0.8677, "accuracy": 1.0, "learning_rate": 5.455573483229143e-06, "epoch": 0.7856865033061066, "percentage": 78.57, "elapsed_time": "4:35:51", "remaining_time": "1:15:14", "throughput": 798.56, "total_tokens": 13217472} {"current_steps": 10110, "total_steps": 12855, "loss": 0.7698, "accuracy": 1.0, "learning_rate": 5.417534543058716e-06, "epoch": 0.7864644107351225, "percentage": 78.65, "elapsed_time": "4:36:12", "remaining_time": "1:14:59", "throughput": 798.5, "total_tokens": 13233008} {"current_steps": 10120, "total_steps": 12855, "loss": 0.9274, "accuracy": 0.800000011920929, "learning_rate": 5.379612558950173e-06, "epoch": 0.7872423181641385, "percentage": 78.72, "elapsed_time": "4:36:38", "remaining_time": "1:14:45", "throughput": 798.34, "total_tokens": 13250944} {"current_steps": 10130, "total_steps": 12855, "loss": 0.7105, "accuracy": 1.0, "learning_rate": 5.341807757392153e-06, "epoch": 0.7880202255931544, "percentage": 78.8, "elapsed_time": "4:36:51", "remaining_time": "1:14:28", "throughput": 798.44, "total_tokens": 13263552} {"current_steps": 10140, "total_steps": 12855, "loss": 0.9119, "accuracy": 1.0, "learning_rate": 5.30412036417342e-06, "epoch": 0.7887981330221704, "percentage": 78.88, "elapsed_time": "4:37:03", "remaining_time": "1:14:11", "throughput": 798.54, "total_tokens": 13274960} {"current_steps": 10150, "total_steps": 12855, "loss": 1.0084, "accuracy": 1.0, "learning_rate": 5.266550604381526e-06, "epoch": 0.7895760404511863, "percentage": 78.96, "elapsed_time": "4:37:21", "remaining_time": "1:13:55", "throughput": 798.51, "total_tokens": 13288768} {"current_steps": 10160, "total_steps": 12855, "loss": 1.0706, "accuracy": 1.0, "learning_rate": 5.229098702401447e-06, "epoch": 0.7903539478802023, "percentage": 79.04, "elapsed_time": "4:37:39", "remaining_time": "1:13:39", "throughput": 798.55, "total_tokens": 13303632} {"current_steps": 10170, "total_steps": 12855, "loss": 1.0391, "accuracy": 1.0, "learning_rate": 5.19176488191426e-06, "epoch": 0.7911318553092183, "percentage": 79.11, "elapsed_time": "4:37:56", "remaining_time": "1:13:22", "throughput": 798.61, "total_tokens": 13317664} {"current_steps": 10180, "total_steps": 12855, "loss": 0.8254, "accuracy": 1.0, "learning_rate": 5.154549365895814e-06, "epoch": 0.7919097627382341, "percentage": 79.19, "elapsed_time": "4:38:18", "remaining_time": "1:13:07", "throughput": 798.55, "total_tokens": 13334128} {"current_steps": 10190, "total_steps": 12855, "loss": 1.2081, "accuracy": 0.8999999761581421, "learning_rate": 5.117452376615345e-06, "epoch": 0.7926876701672501, "percentage": 79.27, "elapsed_time": "4:38:30", "remaining_time": "1:12:50", "throughput": 798.66, "total_tokens": 13346160} {"current_steps": 10200, "total_steps": 12855, "loss": 1.1025, "accuracy": 0.8999999761581421, "learning_rate": 5.0804741356342445e-06, "epoch": 0.793465577596266, "percentage": 79.35, "elapsed_time": "4:38:51", "remaining_time": "1:12:34", "throughput": 798.58, "total_tokens": 13361056} {"current_steps": 10210, "total_steps": 12855, "loss": 1.034, "accuracy": 1.0, "learning_rate": 5.043614863804646e-06, "epoch": 0.794243485025282, "percentage": 79.42, "elapsed_time": "4:39:02", "remaining_time": "1:12:17", "throughput": 798.75, "total_tokens": 13373008} {"current_steps": 10220, "total_steps": 12855, "loss": 0.7596, "accuracy": 0.8999999761581421, "learning_rate": 5.0068747812681505e-06, "epoch": 0.7950213924542979, "percentage": 79.5, "elapsed_time": "4:39:13", "remaining_time": "1:11:59", "throughput": 798.89, "total_tokens": 13383968} {"current_steps": 10230, "total_steps": 12855, "loss": 0.7803, "accuracy": 0.8999999761581421, "learning_rate": 4.970254107454497e-06, "epoch": 0.7957992998833139, "percentage": 79.58, "elapsed_time": "4:39:39", "remaining_time": "1:11:45", "throughput": 798.6, "total_tokens": 13400320} {"current_steps": 10240, "total_steps": 12855, "loss": 1.8045, "accuracy": 0.8999999761581421, "learning_rate": 4.933753061080265e-06, "epoch": 0.7965772073123298, "percentage": 79.66, "elapsed_time": "4:40:17", "remaining_time": "1:11:34", "throughput": 797.93, "total_tokens": 13419232} {"current_steps": 10250, "total_steps": 12855, "loss": 1.1486, "accuracy": 0.8999999761581421, "learning_rate": 4.897371860147556e-06, "epoch": 0.7973551147413458, "percentage": 79.74, "elapsed_time": "4:40:33", "remaining_time": "1:11:18", "throughput": 797.97, "total_tokens": 13432848} {"current_steps": 10260, "total_steps": 12855, "loss": 0.9024, "accuracy": 1.0, "learning_rate": 4.8611107219426996e-06, "epoch": 0.7981330221703618, "percentage": 79.81, "elapsed_time": "4:40:47", "remaining_time": "1:11:01", "throughput": 798.08, "total_tokens": 13445440} {"current_steps": 10270, "total_steps": 12855, "loss": 1.1687, "accuracy": 0.8999999761581421, "learning_rate": 4.824969863034942e-06, "epoch": 0.7989109295993777, "percentage": 79.89, "elapsed_time": "4:41:02", "remaining_time": "1:10:44", "throughput": 798.17, "total_tokens": 13459184} {"current_steps": 10280, "total_steps": 12855, "loss": 0.8515, "accuracy": 1.0, "learning_rate": 4.788949499275177e-06, "epoch": 0.7996888370283937, "percentage": 79.97, "elapsed_time": "4:41:16", "remaining_time": "1:10:27", "throughput": 798.16, "total_tokens": 13470288} {"current_steps": 10290, "total_steps": 12855, "loss": 0.7249, "accuracy": 1.0, "learning_rate": 4.7530498457946325e-06, "epoch": 0.8004667444574096, "percentage": 80.05, "elapsed_time": "4:41:36", "remaining_time": "1:10:11", "throughput": 798.07, "total_tokens": 13484928} {"current_steps": 10300, "total_steps": 12855, "loss": 1.07, "accuracy": 0.800000011920929, "learning_rate": 4.717271117003605e-06, "epoch": 0.8012446518864255, "percentage": 80.12, "elapsed_time": "4:41:47", "remaining_time": "1:09:54", "throughput": 798.15, "total_tokens": 13495120} {"current_steps": 10310, "total_steps": 12855, "loss": 0.8126, "accuracy": 0.8999999761581421, "learning_rate": 4.68161352659015e-06, "epoch": 0.8020225593154414, "percentage": 80.2, "elapsed_time": "4:41:59", "remaining_time": "1:09:36", "throughput": 798.33, "total_tokens": 13506912} {"current_steps": 10320, "total_steps": 12855, "loss": 0.8468, "accuracy": 1.0, "learning_rate": 4.646077287518838e-06, "epoch": 0.8028004667444574, "percentage": 80.28, "elapsed_time": "4:42:10", "remaining_time": "1:09:18", "throughput": 798.34, "total_tokens": 13516128} {"current_steps": 10330, "total_steps": 12855, "loss": 0.8695, "accuracy": 1.0, "learning_rate": 4.610662612029482e-06, "epoch": 0.8035783741734733, "percentage": 80.36, "elapsed_time": "4:42:25", "remaining_time": "1:09:02", "throughput": 798.35, "total_tokens": 13528368} {"current_steps": 10340, "total_steps": 12855, "loss": 0.7204, "accuracy": 1.0, "learning_rate": 4.575369711635843e-06, "epoch": 0.8043562816024893, "percentage": 80.44, "elapsed_time": "4:42:47", "remaining_time": "1:08:46", "throughput": 798.37, "total_tokens": 13545872} {"current_steps": 10350, "total_steps": 12855, "loss": 0.9747, "accuracy": 1.0, "learning_rate": 4.540198797124382e-06, "epoch": 0.8051341890315052, "percentage": 80.51, "elapsed_time": "4:43:07", "remaining_time": "1:08:31", "throughput": 798.37, "total_tokens": 13562416} {"current_steps": 10360, "total_steps": 12855, "loss": 0.9229, "accuracy": 1.0, "learning_rate": 4.5051500785530024e-06, "epoch": 0.8059120964605212, "percentage": 80.59, "elapsed_time": "4:43:28", "remaining_time": "1:08:16", "throughput": 798.38, "total_tokens": 13579456} {"current_steps": 10370, "total_steps": 12855, "loss": 0.7655, "accuracy": 1.0, "learning_rate": 4.470223765249796e-06, "epoch": 0.8066900038895372, "percentage": 80.67, "elapsed_time": "4:43:44", "remaining_time": "1:07:59", "throughput": 798.51, "total_tokens": 13594272} {"current_steps": 10380, "total_steps": 12855, "loss": 0.8874, "accuracy": 0.8999999761581421, "learning_rate": 4.435420065811791e-06, "epoch": 0.8074679113185531, "percentage": 80.75, "elapsed_time": "4:44:03", "remaining_time": "1:07:43", "throughput": 798.58, "total_tokens": 13610336} {"current_steps": 10390, "total_steps": 12855, "loss": 1.0227, "accuracy": 1.0, "learning_rate": 4.4007391881036975e-06, "epoch": 0.8082458187475691, "percentage": 80.82, "elapsed_time": "4:44:16", "remaining_time": "1:07:26", "throughput": 798.68, "total_tokens": 13622880} {"current_steps": 10400, "total_steps": 12855, "loss": 0.9472, "accuracy": 1.0, "learning_rate": 4.3661813392566865e-06, "epoch": 0.809023726176585, "percentage": 80.9, "elapsed_time": "4:44:30", "remaining_time": "1:07:09", "throughput": 798.8, "total_tokens": 13636208} {"current_steps": 10410, "total_steps": 12855, "loss": 0.8132, "accuracy": 1.0, "learning_rate": 4.331746725667132e-06, "epoch": 0.809801633605601, "percentage": 80.98, "elapsed_time": "4:44:43", "remaining_time": "1:06:52", "throughput": 798.94, "total_tokens": 13648832} {"current_steps": 10420, "total_steps": 12855, "loss": 0.9724, "accuracy": 0.8999999761581421, "learning_rate": 4.297435552995391e-06, "epoch": 0.8105795410346169, "percentage": 81.06, "elapsed_time": "4:44:56", "remaining_time": "1:06:35", "throughput": 799.0, "total_tokens": 13659936} {"current_steps": 10430, "total_steps": 12855, "loss": 0.8341, "accuracy": 1.0, "learning_rate": 4.2632480261645705e-06, "epoch": 0.8113574484636328, "percentage": 81.14, "elapsed_time": "4:45:09", "remaining_time": "1:06:17", "throughput": 799.11, "total_tokens": 13672304} {"current_steps": 10440, "total_steps": 12855, "loss": 0.756, "accuracy": 1.0, "learning_rate": 4.229184349359294e-06, "epoch": 0.8121353558926487, "percentage": 81.21, "elapsed_time": "4:45:28", "remaining_time": "1:06:02", "throughput": 799.05, "total_tokens": 13686560} {"current_steps": 10450, "total_steps": 12855, "loss": 0.8569, "accuracy": 0.8999999761581421, "learning_rate": 4.1952447260244995e-06, "epoch": 0.8129132633216647, "percentage": 81.29, "elapsed_time": "4:45:40", "remaining_time": "1:05:44", "throughput": 799.13, "total_tokens": 13697088} {"current_steps": 10460, "total_steps": 12855, "loss": 1.0095, "accuracy": 0.800000011920929, "learning_rate": 4.1614293588642324e-06, "epoch": 0.8136911707506806, "percentage": 81.37, "elapsed_time": "4:45:50", "remaining_time": "1:05:26", "throughput": 799.28, "total_tokens": 13707952} {"current_steps": 10470, "total_steps": 12855, "loss": 0.9935, "accuracy": 0.8999999761581421, "learning_rate": 4.127738449840396e-06, "epoch": 0.8144690781796966, "percentage": 81.45, "elapsed_time": "4:46:04", "remaining_time": "1:05:09", "throughput": 799.36, "total_tokens": 13720752} {"current_steps": 10480, "total_steps": 12855, "loss": 0.7456, "accuracy": 0.8999999761581421, "learning_rate": 4.094172200171578e-06, "epoch": 0.8152469856087126, "percentage": 81.52, "elapsed_time": "4:46:17", "remaining_time": "1:04:52", "throughput": 799.45, "total_tokens": 13732592} {"current_steps": 10490, "total_steps": 12855, "loss": 0.8456, "accuracy": 0.8999999761581421, "learning_rate": 4.060730810331839e-06, "epoch": 0.8160248930377285, "percentage": 81.6, "elapsed_time": "4:46:33", "remaining_time": "1:04:36", "throughput": 799.48, "total_tokens": 13745536} {"current_steps": 10500, "total_steps": 12855, "loss": 0.7924, "accuracy": 0.8999999761581421, "learning_rate": 4.0274144800495216e-06, "epoch": 0.8168028004667445, "percentage": 81.68, "elapsed_time": "4:46:48", "remaining_time": "1:04:19", "throughput": 799.58, "total_tokens": 13759344} {"current_steps": 10510, "total_steps": 12855, "loss": 0.8891, "accuracy": 1.0, "learning_rate": 3.994223408306039e-06, "epoch": 0.8175807078957604, "percentage": 81.76, "elapsed_time": "4:47:01", "remaining_time": "1:04:02", "throughput": 799.69, "total_tokens": 13772224} {"current_steps": 10520, "total_steps": 12855, "loss": 0.7657, "accuracy": 1.0, "learning_rate": 3.961157793334708e-06, "epoch": 0.8183586153247764, "percentage": 81.84, "elapsed_time": "4:47:16", "remaining_time": "1:03:45", "throughput": 799.82, "total_tokens": 13785824} {"current_steps": 10530, "total_steps": 12855, "loss": 0.7805, "accuracy": 1.0, "learning_rate": 3.928217832619555e-06, "epoch": 0.8191365227537923, "percentage": 81.91, "elapsed_time": "4:47:30", "remaining_time": "1:03:28", "throughput": 799.94, "total_tokens": 13799584} {"current_steps": 10540, "total_steps": 12855, "loss": 0.8786, "accuracy": 1.0, "learning_rate": 3.89540372289414e-06, "epoch": 0.8199144301828083, "percentage": 81.99, "elapsed_time": "4:47:50", "remaining_time": "1:03:13", "throughput": 799.94, "total_tokens": 13815536} {"current_steps": 10550, "total_steps": 12855, "loss": 0.8717, "accuracy": 0.8999999761581421, "learning_rate": 3.862715660140376e-06, "epoch": 0.8206923376118241, "percentage": 82.07, "elapsed_time": "4:48:10", "remaining_time": "1:02:57", "throughput": 799.95, "total_tokens": 13831408} {"current_steps": 10560, "total_steps": 12855, "loss": 0.824, "accuracy": 0.8999999761581421, "learning_rate": 3.830153839587352e-06, "epoch": 0.8214702450408401, "percentage": 82.15, "elapsed_time": "4:48:23", "remaining_time": "1:02:40", "throughput": 799.99, "total_tokens": 13842800} {"current_steps": 10570, "total_steps": 12855, "loss": 0.9086, "accuracy": 1.0, "learning_rate": 3.7977184557101975e-06, "epoch": 0.822248152469856, "percentage": 82.22, "elapsed_time": "4:48:43", "remaining_time": "1:02:24", "throughput": 799.98, "total_tokens": 13858096} {"current_steps": 10580, "total_steps": 12855, "loss": 0.9093, "accuracy": 1.0, "learning_rate": 3.765409702228881e-06, "epoch": 0.823026059898872, "percentage": 82.3, "elapsed_time": "4:49:01", "remaining_time": "1:02:08", "throughput": 799.96, "total_tokens": 13872416} {"current_steps": 10590, "total_steps": 12855, "loss": 0.8318, "accuracy": 1.0, "learning_rate": 3.7332277721070925e-06, "epoch": 0.823803967327888, "percentage": 82.38, "elapsed_time": "4:49:13", "remaining_time": "1:01:51", "throughput": 800.01, "total_tokens": 13883168} {"current_steps": 10600, "total_steps": 12855, "loss": 0.7929, "accuracy": 1.0, "learning_rate": 3.7011728575510525e-06, "epoch": 0.8245818747569039, "percentage": 82.46, "elapsed_time": "4:49:29", "remaining_time": "1:01:35", "throughput": 800.1, "total_tokens": 13897536} {"current_steps": 10610, "total_steps": 12855, "loss": 0.936, "accuracy": 0.8999999761581421, "learning_rate": 3.6692451500083908e-06, "epoch": 0.8253597821859199, "percentage": 82.54, "elapsed_time": "4:50:03", "remaining_time": "1:01:22", "throughput": 799.76, "total_tokens": 13918352} {"current_steps": 10620, "total_steps": 12855, "loss": 0.8878, "accuracy": 0.8999999761581421, "learning_rate": 3.6374448401669952e-06, "epoch": 0.8261376896149358, "percentage": 82.61, "elapsed_time": "4:50:22", "remaining_time": "1:01:06", "throughput": 799.81, "total_tokens": 13934352} {"current_steps": 10630, "total_steps": 12855, "loss": 0.9111, "accuracy": 0.8999999761581421, "learning_rate": 3.6057721179538678e-06, "epoch": 0.8269155970439518, "percentage": 82.69, "elapsed_time": "4:50:38", "remaining_time": "1:00:50", "throughput": 799.85, "total_tokens": 13947840} {"current_steps": 10640, "total_steps": 12855, "loss": 3.1668, "accuracy": 1.0, "learning_rate": 3.574227172533995e-06, "epoch": 0.8276935044729677, "percentage": 82.77, "elapsed_time": "4:50:49", "remaining_time": "1:00:32", "throughput": 800.07, "total_tokens": 13960624} {"current_steps": 10650, "total_steps": 12855, "loss": 1.2053, "accuracy": 0.800000011920929, "learning_rate": 3.5428101923092262e-06, "epoch": 0.8284714119019837, "percentage": 82.85, "elapsed_time": "4:51:22", "remaining_time": "1:00:19", "throughput": 799.51, "total_tokens": 13977696} {"current_steps": 10660, "total_steps": 12855, "loss": 0.9772, "accuracy": 0.8999999761581421, "learning_rate": 3.5115213649171306e-06, "epoch": 0.8292493193309997, "percentage": 82.92, "elapsed_time": "4:51:32", "remaining_time": "1:00:01", "throughput": 799.62, "total_tokens": 13987552} {"current_steps": 10670, "total_steps": 12855, "loss": 0.7224, "accuracy": 0.800000011920929, "learning_rate": 3.4803608772298907e-06, "epoch": 0.8300272267600156, "percentage": 83.0, "elapsed_time": "4:51:40", "remaining_time": "0:59:43", "throughput": 799.69, "total_tokens": 13994992} {"current_steps": 10680, "total_steps": 12855, "loss": 0.8346, "accuracy": 1.0, "learning_rate": 3.4493289153531836e-06, "epoch": 0.8308051341890315, "percentage": 83.08, "elapsed_time": "4:51:57", "remaining_time": "0:59:27", "throughput": 799.76, "total_tokens": 14009648} {"current_steps": 10690, "total_steps": 12855, "loss": 0.9122, "accuracy": 0.8999999761581421, "learning_rate": 3.4184256646250524e-06, "epoch": 0.8315830416180474, "percentage": 83.16, "elapsed_time": "4:52:11", "remaining_time": "0:59:10", "throughput": 799.84, "total_tokens": 14022320} {"current_steps": 10700, "total_steps": 12855, "loss": 0.9276, "accuracy": 1.0, "learning_rate": 3.3876513096148338e-06, "epoch": 0.8323609490470634, "percentage": 83.24, "elapsed_time": "4:52:21", "remaining_time": "0:58:52", "throughput": 799.86, "total_tokens": 14031024} {"current_steps": 10710, "total_steps": 12855, "loss": 0.967, "accuracy": 1.0, "learning_rate": 3.3570060341220234e-06, "epoch": 0.8331388564760793, "percentage": 83.31, "elapsed_time": "4:52:41", "remaining_time": "0:58:37", "throughput": 799.85, "total_tokens": 14046720} {"current_steps": 10720, "total_steps": 12855, "loss": 0.7118, "accuracy": 1.0, "learning_rate": 3.326490021175205e-06, "epoch": 0.8339167639050953, "percentage": 83.39, "elapsed_time": "4:53:01", "remaining_time": "0:58:21", "throughput": 799.75, "total_tokens": 14060992} {"current_steps": 10730, "total_steps": 12855, "loss": 0.7835, "accuracy": 1.0, "learning_rate": 3.296103453030927e-06, "epoch": 0.8346946713341112, "percentage": 83.47, "elapsed_time": "4:53:12", "remaining_time": "0:58:04", "throughput": 799.9, "total_tokens": 14072560} {"current_steps": 10740, "total_steps": 12855, "loss": 1.0248, "accuracy": 0.8999999761581421, "learning_rate": 3.2658465111726405e-06, "epoch": 0.8354725787631272, "percentage": 83.55, "elapsed_time": "4:53:30", "remaining_time": "0:57:47", "throughput": 799.82, "total_tokens": 14085216} {"current_steps": 10750, "total_steps": 12855, "loss": 0.8609, "accuracy": 0.800000011920929, "learning_rate": 3.2357193763095984e-06, "epoch": 0.8362504861921431, "percentage": 83.63, "elapsed_time": "4:53:55", "remaining_time": "0:57:33", "throughput": 799.62, "total_tokens": 14102064} {"current_steps": 10760, "total_steps": 12855, "loss": 0.9311, "accuracy": 1.0, "learning_rate": 3.2057222283757877e-06, "epoch": 0.8370283936211591, "percentage": 83.7, "elapsed_time": "4:54:13", "remaining_time": "0:57:17", "throughput": 799.7, "total_tokens": 14117840} {"current_steps": 10770, "total_steps": 12855, "loss": 1.7031, "accuracy": 0.8999999761581421, "learning_rate": 3.175855246528847e-06, "epoch": 0.8378063010501751, "percentage": 83.78, "elapsed_time": "4:54:25", "remaining_time": "0:57:00", "throughput": 799.78, "total_tokens": 14128832} {"current_steps": 10780, "total_steps": 12855, "loss": 0.9301, "accuracy": 0.8999999761581421, "learning_rate": 3.1461186091490015e-06, "epoch": 0.838584208479191, "percentage": 83.86, "elapsed_time": "4:54:41", "remaining_time": "0:56:43", "throughput": 799.88, "total_tokens": 14143392} {"current_steps": 10790, "total_steps": 12855, "loss": 0.7818, "accuracy": 1.0, "learning_rate": 3.1165124938379947e-06, "epoch": 0.839362115908207, "percentage": 83.94, "elapsed_time": "4:54:53", "remaining_time": "0:56:26", "throughput": 799.94, "total_tokens": 14153776} {"current_steps": 10800, "total_steps": 12855, "loss": 1.0033, "accuracy": 1.0, "learning_rate": 3.0870370774180315e-06, "epoch": 0.8401400233372228, "percentage": 84.01, "elapsed_time": "4:55:13", "remaining_time": "0:56:10", "throughput": 799.95, "total_tokens": 14169824} {"current_steps": 10810, "total_steps": 12855, "loss": 0.7738, "accuracy": 0.8999999761581421, "learning_rate": 3.0576925359307063e-06, "epoch": 0.8409179307662388, "percentage": 84.09, "elapsed_time": "4:55:28", "remaining_time": "0:55:53", "throughput": 799.96, "total_tokens": 14181936} {"current_steps": 10820, "total_steps": 12855, "loss": 1.3577, "accuracy": 1.0, "learning_rate": 3.0284790446359817e-06, "epoch": 0.8416958381952547, "percentage": 84.17, "elapsed_time": "4:55:42", "remaining_time": "0:55:36", "throughput": 800.03, "total_tokens": 14194352} {"current_steps": 10830, "total_steps": 12855, "loss": 0.7328, "accuracy": 1.0, "learning_rate": 2.9993967780111126e-06, "epoch": 0.8424737456242707, "percentage": 84.25, "elapsed_time": "4:56:05", "remaining_time": "0:55:21", "throughput": 800.04, "total_tokens": 14213520} {"current_steps": 10840, "total_steps": 12855, "loss": 0.9138, "accuracy": 0.800000011920929, "learning_rate": 2.970445909749614e-06, "epoch": 0.8432516530532866, "percentage": 84.33, "elapsed_time": "4:56:22", "remaining_time": "0:55:05", "throughput": 800.12, "total_tokens": 14228208} {"current_steps": 10850, "total_steps": 12855, "loss": 0.7905, "accuracy": 0.8999999761581421, "learning_rate": 2.9416266127602484e-06, "epoch": 0.8440295604823026, "percentage": 84.4, "elapsed_time": "4:56:45", "remaining_time": "0:54:50", "throughput": 799.98, "total_tokens": 14243744} {"current_steps": 10860, "total_steps": 12855, "loss": 0.9084, "accuracy": 1.0, "learning_rate": 2.9129390591659422e-06, "epoch": 0.8448074679113186, "percentage": 84.48, "elapsed_time": "4:56:56", "remaining_time": "0:54:32", "throughput": 800.02, "total_tokens": 14253184} {"current_steps": 10870, "total_steps": 12855, "loss": 0.786, "accuracy": 0.8999999761581421, "learning_rate": 2.8843834203027997e-06, "epoch": 0.8455853753403345, "percentage": 84.56, "elapsed_time": "4:57:12", "remaining_time": "0:54:16", "throughput": 800.07, "total_tokens": 14267296} {"current_steps": 10880, "total_steps": 12855, "loss": 0.8987, "accuracy": 1.0, "learning_rate": 2.855959866719063e-06, "epoch": 0.8463632827693505, "percentage": 84.64, "elapsed_time": "4:57:21", "remaining_time": "0:53:58", "throughput": 800.19, "total_tokens": 14276864} {"current_steps": 10890, "total_steps": 12855, "loss": 0.9112, "accuracy": 0.8999999761581421, "learning_rate": 2.8276685681740966e-06, "epoch": 0.8471411901983664, "percentage": 84.71, "elapsed_time": "4:57:35", "remaining_time": "0:53:41", "throughput": 800.26, "total_tokens": 14289088} {"current_steps": 10900, "total_steps": 12855, "loss": 0.8632, "accuracy": 1.0, "learning_rate": 2.7995096936373728e-06, "epoch": 0.8479190976273824, "percentage": 84.79, "elapsed_time": "4:57:53", "remaining_time": "0:53:25", "throughput": 800.22, "total_tokens": 14303184} {"current_steps": 10910, "total_steps": 12855, "loss": 1.1989, "accuracy": 1.0, "learning_rate": 2.771483411287462e-06, "epoch": 0.8486970050563983, "percentage": 84.87, "elapsed_time": "4:58:06", "remaining_time": "0:53:08", "throughput": 800.33, "total_tokens": 14314880} {"current_steps": 10920, "total_steps": 12855, "loss": 0.7916, "accuracy": 0.8999999761581421, "learning_rate": 2.7435898885110332e-06, "epoch": 0.8494749124854143, "percentage": 84.95, "elapsed_time": "4:58:17", "remaining_time": "0:52:51", "throughput": 800.4, "total_tokens": 14325008} {"current_steps": 10930, "total_steps": 12855, "loss": 1.8577, "accuracy": 1.0, "learning_rate": 2.715829291901853e-06, "epoch": 0.8502528199144301, "percentage": 85.03, "elapsed_time": "4:58:47", "remaining_time": "0:52:37", "throughput": 800.16, "total_tokens": 14345152} {"current_steps": 10940, "total_steps": 12855, "loss": 0.952, "accuracy": 0.8999999761581421, "learning_rate": 2.6882017872597725e-06, "epoch": 0.8510307273434461, "percentage": 85.1, "elapsed_time": "4:58:59", "remaining_time": "0:52:20", "throughput": 800.23, "total_tokens": 14355328} {"current_steps": 10950, "total_steps": 12855, "loss": 0.8647, "accuracy": 1.0, "learning_rate": 2.660707539589766e-06, "epoch": 0.851808634772462, "percentage": 85.18, "elapsed_time": "4:59:15", "remaining_time": "0:52:03", "throughput": 800.25, "total_tokens": 14369184} {"current_steps": 10960, "total_steps": 12855, "loss": 1.2342, "accuracy": 1.0, "learning_rate": 2.633346713100929e-06, "epoch": 0.852586542201478, "percentage": 85.26, "elapsed_time": "4:59:31", "remaining_time": "0:51:47", "throughput": 800.31, "total_tokens": 14382736} {"current_steps": 10970, "total_steps": 12855, "loss": 0.8513, "accuracy": 0.8999999761581421, "learning_rate": 2.6061194712054927e-06, "epoch": 0.853364449630494, "percentage": 85.34, "elapsed_time": "4:59:45", "remaining_time": "0:51:30", "throughput": 800.38, "total_tokens": 14395296} {"current_steps": 10980, "total_steps": 12855, "loss": 0.8863, "accuracy": 1.0, "learning_rate": 2.5790259765178764e-06, "epoch": 0.8541423570595099, "percentage": 85.41, "elapsed_time": "5:00:05", "remaining_time": "0:51:14", "throughput": 800.29, "total_tokens": 14409472} {"current_steps": 10990, "total_steps": 12855, "loss": 1.0076, "accuracy": 1.0, "learning_rate": 2.55206639085368e-06, "epoch": 0.8549202644885259, "percentage": 85.49, "elapsed_time": "5:00:17", "remaining_time": "0:50:57", "throughput": 800.39, "total_tokens": 14421104} {"current_steps": 11000, "total_steps": 12855, "loss": 1.072, "accuracy": 1.0, "learning_rate": 2.5252408752287295e-06, "epoch": 0.8556981719175418, "percentage": 85.57, "elapsed_time": "5:00:32", "remaining_time": "0:50:40", "throughput": 800.51, "total_tokens": 14435216} {"current_steps": 11010, "total_steps": 12855, "loss": 1.2045, "accuracy": 1.0, "learning_rate": 2.498549589858126e-06, "epoch": 0.8564760793465578, "percentage": 85.65, "elapsed_time": "5:00:48", "remaining_time": "0:50:24", "throughput": 800.37, "total_tokens": 14445648} {"current_steps": 11020, "total_steps": 12855, "loss": 0.9651, "accuracy": 1.0, "learning_rate": 2.471992694155284e-06, "epoch": 0.8572539867755737, "percentage": 85.73, "elapsed_time": "5:01:11", "remaining_time": "0:50:09", "throughput": 800.27, "total_tokens": 14461808} {"current_steps": 11030, "total_steps": 12855, "loss": 1.0341, "accuracy": 0.800000011920929, "learning_rate": 2.4455703467309743e-06, "epoch": 0.8580318942045897, "percentage": 85.8, "elapsed_time": "5:01:28", "remaining_time": "0:49:52", "throughput": 800.27, "total_tokens": 14475792} {"current_steps": 11040, "total_steps": 12855, "loss": 1.0406, "accuracy": 1.0, "learning_rate": 2.4192827053923754e-06, "epoch": 0.8588098016336057, "percentage": 85.88, "elapsed_time": "5:01:53", "remaining_time": "0:49:37", "throughput": 800.13, "total_tokens": 14493312} {"current_steps": 11050, "total_steps": 12855, "loss": 0.7799, "accuracy": 1.0, "learning_rate": 2.3931299271421485e-06, "epoch": 0.8595877090626215, "percentage": 85.96, "elapsed_time": "5:02:08", "remaining_time": "0:49:21", "throughput": 800.22, "total_tokens": 14506896} {"current_steps": 11060, "total_steps": 12855, "loss": 1.0027, "accuracy": 1.0, "learning_rate": 2.3671121681774655e-06, "epoch": 0.8603656164916375, "percentage": 86.04, "elapsed_time": "5:02:23", "remaining_time": "0:49:04", "throughput": 800.21, "total_tokens": 14519024} {"current_steps": 11070, "total_steps": 12855, "loss": 0.8474, "accuracy": 1.0, "learning_rate": 2.3412295838891123e-06, "epoch": 0.8611435239206534, "percentage": 86.11, "elapsed_time": "5:02:46", "remaining_time": "0:48:49", "throughput": 800.25, "total_tokens": 14537424} {"current_steps": 11080, "total_steps": 12855, "loss": 1.0211, "accuracy": 0.8999999761581421, "learning_rate": 2.315482328860544e-06, "epoch": 0.8619214313496694, "percentage": 86.19, "elapsed_time": "5:02:58", "remaining_time": "0:48:32", "throughput": 800.3, "total_tokens": 14548432} {"current_steps": 11090, "total_steps": 12855, "loss": 0.9877, "accuracy": 1.0, "learning_rate": 2.2898705568669605e-06, "epoch": 0.8626993387786853, "percentage": 86.27, "elapsed_time": "5:03:10", "remaining_time": "0:48:15", "throughput": 800.36, "total_tokens": 14558768} {"current_steps": 11100, "total_steps": 12855, "loss": 0.8501, "accuracy": 1.0, "learning_rate": 2.2643944208743912e-06, "epoch": 0.8634772462077013, "percentage": 86.35, "elapsed_time": "5:03:31", "remaining_time": "0:47:59", "throughput": 800.4, "total_tokens": 14576400} {"current_steps": 11110, "total_steps": 12855, "loss": 0.8109, "accuracy": 1.0, "learning_rate": 2.2390540730387768e-06, "epoch": 0.8642551536367172, "percentage": 86.43, "elapsed_time": "5:03:44", "remaining_time": "0:47:42", "throughput": 800.46, "total_tokens": 14587648} {"current_steps": 11120, "total_steps": 12855, "loss": 0.7796, "accuracy": 0.8999999761581421, "learning_rate": 2.2138496647050783e-06, "epoch": 0.8650330610657332, "percentage": 86.5, "elapsed_time": "5:03:55", "remaining_time": "0:47:25", "throughput": 800.44, "total_tokens": 14596320} {"current_steps": 11130, "total_steps": 12855, "loss": 0.8225, "accuracy": 1.0, "learning_rate": 2.1887813464063433e-06, "epoch": 0.8658109684947491, "percentage": 86.58, "elapsed_time": "5:04:09", "remaining_time": "0:47:08", "throughput": 800.57, "total_tokens": 14609632} {"current_steps": 11140, "total_steps": 12855, "loss": 0.8531, "accuracy": 0.800000011920929, "learning_rate": 2.163849267862833e-06, "epoch": 0.8665888759237651, "percentage": 86.66, "elapsed_time": "5:04:32", "remaining_time": "0:46:53", "throughput": 800.26, "total_tokens": 14622960} {"current_steps": 11150, "total_steps": 12855, "loss": 0.9558, "accuracy": 1.0, "learning_rate": 2.139053577981115e-06, "epoch": 0.8673667833527811, "percentage": 86.74, "elapsed_time": "5:04:47", "remaining_time": "0:46:36", "throughput": 800.29, "total_tokens": 14635344} {"current_steps": 11160, "total_steps": 12855, "loss": 0.8762, "accuracy": 1.0, "learning_rate": 2.114394424853178e-06, "epoch": 0.868144690781797, "percentage": 86.81, "elapsed_time": "5:05:01", "remaining_time": "0:46:19", "throughput": 800.4, "total_tokens": 14648704} {"current_steps": 11170, "total_steps": 12855, "loss": 0.8976, "accuracy": 0.800000011920929, "learning_rate": 2.089871955755543e-06, "epoch": 0.868922598210813, "percentage": 86.89, "elapsed_time": "5:05:13", "remaining_time": "0:46:02", "throughput": 800.47, "total_tokens": 14659184} {"current_steps": 11180, "total_steps": 12855, "loss": 0.8291, "accuracy": 0.800000011920929, "learning_rate": 2.065486317148396e-06, "epoch": 0.8697005056398288, "percentage": 86.97, "elapsed_time": "5:05:26", "remaining_time": "0:45:45", "throughput": 800.57, "total_tokens": 14671552} {"current_steps": 11190, "total_steps": 12855, "loss": 0.9947, "accuracy": 1.0, "learning_rate": 2.041237654674691e-06, "epoch": 0.8704784130688448, "percentage": 87.05, "elapsed_time": "5:05:44", "remaining_time": "0:45:29", "throughput": 800.62, "total_tokens": 14686624} {"current_steps": 11200, "total_steps": 12855, "loss": 1.012, "accuracy": 0.8999999761581421, "learning_rate": 2.017126113159301e-06, "epoch": 0.8712563204978607, "percentage": 87.13, "elapsed_time": "5:06:02", "remaining_time": "0:45:13", "throughput": 800.66, "total_tokens": 14702144} {"current_steps": 11210, "total_steps": 12855, "loss": 0.5797, "accuracy": 1.0, "learning_rate": 1.993151836608151e-06, "epoch": 0.8720342279268767, "percentage": 87.2, "elapsed_time": "5:06:19", "remaining_time": "0:44:57", "throughput": 800.63, "total_tokens": 14715008} {"current_steps": 11220, "total_steps": 12855, "loss": 1.1946, "accuracy": 1.0, "learning_rate": 1.9693149682073393e-06, "epoch": 0.8728121353558926, "percentage": 87.28, "elapsed_time": "5:06:34", "remaining_time": "0:44:40", "throughput": 800.6, "total_tokens": 14726608} {"current_steps": 11230, "total_steps": 12855, "loss": 0.9768, "accuracy": 0.8999999761581421, "learning_rate": 1.9456156503223107e-06, "epoch": 0.8735900427849086, "percentage": 87.36, "elapsed_time": "5:06:50", "remaining_time": "0:44:24", "throughput": 800.63, "total_tokens": 14739920} {"current_steps": 11240, "total_steps": 12855, "loss": 1.2682, "accuracy": 1.0, "learning_rate": 1.922054024496975e-06, "epoch": 0.8743679502139245, "percentage": 87.44, "elapsed_time": "5:07:01", "remaining_time": "0:44:06", "throughput": 800.71, "total_tokens": 14750096} {"current_steps": 11250, "total_steps": 12855, "loss": 0.9424, "accuracy": 1.0, "learning_rate": 1.898630231452897e-06, "epoch": 0.8751458576429405, "percentage": 87.51, "elapsed_time": "5:07:14", "remaining_time": "0:43:50", "throughput": 800.78, "total_tokens": 14762112} {"current_steps": 11260, "total_steps": 12855, "loss": 1.0263, "accuracy": 0.8999999761581421, "learning_rate": 1.8753444110884172e-06, "epoch": 0.8759237650719565, "percentage": 87.59, "elapsed_time": "5:07:25", "remaining_time": "0:43:32", "throughput": 800.89, "total_tokens": 14772640} {"current_steps": 11270, "total_steps": 12855, "loss": 0.8807, "accuracy": 1.0, "learning_rate": 1.8521967024778487e-06, "epoch": 0.8767016725009724, "percentage": 87.67, "elapsed_time": "5:07:37", "remaining_time": "0:43:15", "throughput": 800.95, "total_tokens": 14783424} {"current_steps": 11280, "total_steps": 12855, "loss": 0.8601, "accuracy": 0.8999999761581421, "learning_rate": 1.829187243870628e-06, "epoch": 0.8774795799299884, "percentage": 87.75, "elapsed_time": "5:07:54", "remaining_time": "0:42:59", "throughput": 801.0, "total_tokens": 14798224} {"current_steps": 11290, "total_steps": 12855, "loss": 0.8365, "accuracy": 0.800000011920929, "learning_rate": 1.8063161726904976e-06, "epoch": 0.8782574873590043, "percentage": 87.83, "elapsed_time": "5:08:06", "remaining_time": "0:42:42", "throughput": 801.08, "total_tokens": 14809200} {"current_steps": 11300, "total_steps": 12855, "loss": 0.9016, "accuracy": 0.8999999761581421, "learning_rate": 1.783583625534682e-06, "epoch": 0.8790353947880202, "percentage": 87.9, "elapsed_time": "5:08:29", "remaining_time": "0:42:27", "throughput": 801.09, "total_tokens": 14828032} {"current_steps": 11310, "total_steps": 12855, "loss": 0.9042, "accuracy": 1.0, "learning_rate": 1.7609897381730662e-06, "epoch": 0.8798133022170361, "percentage": 87.98, "elapsed_time": "5:08:44", "remaining_time": "0:42:10", "throughput": 801.16, "total_tokens": 14840864} {"current_steps": 11320, "total_steps": 12855, "loss": 0.9976, "accuracy": 0.8999999761581421, "learning_rate": 1.7385346455474016e-06, "epoch": 0.8805912096460521, "percentage": 88.06, "elapsed_time": "5:09:02", "remaining_time": "0:41:54", "throughput": 801.18, "total_tokens": 14855616} {"current_steps": 11330, "total_steps": 12855, "loss": 0.8987, "accuracy": 1.0, "learning_rate": 1.716218481770482e-06, "epoch": 0.881369117075068, "percentage": 88.14, "elapsed_time": "5:09:10", "remaining_time": "0:41:36", "throughput": 801.31, "total_tokens": 14864624} {"current_steps": 11340, "total_steps": 12855, "loss": 0.8339, "accuracy": 0.800000011920929, "learning_rate": 1.6940413801253524e-06, "epoch": 0.882147024504084, "percentage": 88.21, "elapsed_time": "5:09:29", "remaining_time": "0:41:20", "throughput": 801.35, "total_tokens": 14880496} {"current_steps": 11350, "total_steps": 12855, "loss": 1.5936, "accuracy": 1.0, "learning_rate": 1.6720034730645152e-06, "epoch": 0.8829249319331, "percentage": 88.29, "elapsed_time": "5:09:42", "remaining_time": "0:41:03", "throughput": 801.38, "total_tokens": 14891360} {"current_steps": 11360, "total_steps": 12855, "loss": 1.0346, "accuracy": 1.0, "learning_rate": 1.6501048922091255e-06, "epoch": 0.8837028393621159, "percentage": 88.37, "elapsed_time": "5:09:54", "remaining_time": "0:40:47", "throughput": 801.44, "total_tokens": 14902688} {"current_steps": 11370, "total_steps": 12855, "loss": 0.9604, "accuracy": 1.0, "learning_rate": 1.628345768348219e-06, "epoch": 0.8844807467911319, "percentage": 88.45, "elapsed_time": "5:10:08", "remaining_time": "0:40:30", "throughput": 801.53, "total_tokens": 14915024} {"current_steps": 11380, "total_steps": 12855, "loss": 0.9175, "accuracy": 0.8999999761581421, "learning_rate": 1.6067262314379327e-06, "epoch": 0.8852586542201478, "percentage": 88.53, "elapsed_time": "5:10:20", "remaining_time": "0:40:13", "throughput": 801.5, "total_tokens": 14924096} {"current_steps": 11390, "total_steps": 12855, "loss": 0.9809, "accuracy": 1.0, "learning_rate": 1.585246410600713e-06, "epoch": 0.8860365616491638, "percentage": 88.6, "elapsed_time": "5:10:35", "remaining_time": "0:39:56", "throughput": 801.56, "total_tokens": 14937840} {"current_steps": 11400, "total_steps": 12855, "loss": 0.7929, "accuracy": 1.0, "learning_rate": 1.563906434124554e-06, "epoch": 0.8868144690781797, "percentage": 88.68, "elapsed_time": "5:10:48", "remaining_time": "0:39:40", "throughput": 801.66, "total_tokens": 14949600} {"current_steps": 11410, "total_steps": 12855, "loss": 0.7525, "accuracy": 0.8999999761581421, "learning_rate": 1.5427064294622318e-06, "epoch": 0.8875923765071957, "percentage": 88.76, "elapsed_time": "5:11:04", "remaining_time": "0:39:23", "throughput": 801.65, "total_tokens": 14962416} {"current_steps": 11420, "total_steps": 12855, "loss": 0.6949, "accuracy": 0.8999999761581421, "learning_rate": 1.521646523230552e-06, "epoch": 0.8883702839362115, "percentage": 88.84, "elapsed_time": "5:11:18", "remaining_time": "0:39:07", "throughput": 801.69, "total_tokens": 14974592} {"current_steps": 11430, "total_steps": 12855, "loss": 0.9439, "accuracy": 0.8999999761581421, "learning_rate": 1.5007268412095654e-06, "epoch": 0.8891481913652275, "percentage": 88.91, "elapsed_time": "5:11:26", "remaining_time": "0:38:49", "throughput": 801.8, "total_tokens": 14983280} {"current_steps": 11440, "total_steps": 12855, "loss": 0.8139, "accuracy": 1.0, "learning_rate": 1.4799475083418474e-06, "epoch": 0.8899260987942434, "percentage": 88.99, "elapsed_time": "5:11:40", "remaining_time": "0:38:32", "throughput": 801.9, "total_tokens": 14995552} {"current_steps": 11450, "total_steps": 12855, "loss": 0.9004, "accuracy": 1.0, "learning_rate": 1.4593086487317386e-06, "epoch": 0.8907040062232594, "percentage": 89.07, "elapsed_time": "5:11:50", "remaining_time": "0:38:15", "throughput": 802.0, "total_tokens": 15005920} {"current_steps": 11460, "total_steps": 12855, "loss": 0.972, "accuracy": 0.8999999761581421, "learning_rate": 1.4388103856446067e-06, "epoch": 0.8914819136522754, "percentage": 89.15, "elapsed_time": "5:12:04", "remaining_time": "0:37:59", "throughput": 802.11, "total_tokens": 15018672} {"current_steps": 11470, "total_steps": 12855, "loss": 0.9642, "accuracy": 1.0, "learning_rate": 1.4184528415060988e-06, "epoch": 0.8922598210812913, "percentage": 89.23, "elapsed_time": "5:12:16", "remaining_time": "0:37:42", "throughput": 802.19, "total_tokens": 15030528} {"current_steps": 11480, "total_steps": 12855, "loss": 1.1139, "accuracy": 1.0, "learning_rate": 1.3982361379014319e-06, "epoch": 0.8930377285103073, "percentage": 89.3, "elapsed_time": "5:12:28", "remaining_time": "0:37:25", "throughput": 802.31, "total_tokens": 15042128} {"current_steps": 11490, "total_steps": 12855, "loss": 0.6479, "accuracy": 0.8999999761581421, "learning_rate": 1.378160395574643e-06, "epoch": 0.8938156359393232, "percentage": 89.38, "elapsed_time": "5:12:41", "remaining_time": "0:37:08", "throughput": 802.34, "total_tokens": 15053104} {"current_steps": 11500, "total_steps": 12855, "loss": 1.0813, "accuracy": 0.800000011920929, "learning_rate": 1.358225734427887e-06, "epoch": 0.8945935433683392, "percentage": 89.46, "elapsed_time": "5:12:58", "remaining_time": "0:36:52", "throughput": 802.32, "total_tokens": 15066512} {"current_steps": 11510, "total_steps": 12855, "loss": 0.9158, "accuracy": 1.0, "learning_rate": 1.3384322735207123e-06, "epoch": 0.8953714507973551, "percentage": 89.54, "elapsed_time": "5:13:13", "remaining_time": "0:36:36", "throughput": 802.37, "total_tokens": 15079392} {"current_steps": 11520, "total_steps": 12855, "loss": 0.6161, "accuracy": 0.8999999761581421, "learning_rate": 1.318780131069347e-06, "epoch": 0.8961493582263711, "percentage": 89.61, "elapsed_time": "5:13:28", "remaining_time": "0:36:19", "throughput": 802.42, "total_tokens": 15092336} {"current_steps": 11530, "total_steps": 12855, "loss": 0.7547, "accuracy": 1.0, "learning_rate": 1.2992694244460008e-06, "epoch": 0.896927265655387, "percentage": 89.69, "elapsed_time": "5:13:46", "remaining_time": "0:36:03", "throughput": 802.43, "total_tokens": 15107072} {"current_steps": 11540, "total_steps": 12855, "loss": 1.6142, "accuracy": 0.8999999761581421, "learning_rate": 1.2799002701781526e-06, "epoch": 0.897705173084403, "percentage": 89.77, "elapsed_time": "5:14:06", "remaining_time": "0:35:47", "throughput": 802.39, "total_tokens": 15122032} {"current_steps": 11550, "total_steps": 12855, "loss": 0.6518, "accuracy": 1.0, "learning_rate": 1.2606727839478721e-06, "epoch": 0.8984830805134189, "percentage": 89.85, "elapsed_time": "5:14:23", "remaining_time": "0:35:31", "throughput": 802.36, "total_tokens": 15135648} {"current_steps": 11560, "total_steps": 12855, "loss": 0.9793, "accuracy": 0.8999999761581421, "learning_rate": 1.2415870805911056e-06, "epoch": 0.8992609879424348, "percentage": 89.93, "elapsed_time": "5:14:35", "remaining_time": "0:35:14", "throughput": 802.45, "total_tokens": 15146576} {"current_steps": 11570, "total_steps": 12855, "loss": 0.9127, "accuracy": 0.8999999761581421, "learning_rate": 1.2226432740970073e-06, "epoch": 0.9000388953714508, "percentage": 90.0, "elapsed_time": "5:14:49", "remaining_time": "0:34:57", "throughput": 802.59, "total_tokens": 15160624} {"current_steps": 11580, "total_steps": 12855, "loss": 0.9546, "accuracy": 0.8999999761581421, "learning_rate": 1.2038414776072593e-06, "epoch": 0.9008168028004667, "percentage": 90.08, "elapsed_time": "5:15:07", "remaining_time": "0:34:41", "throughput": 802.62, "total_tokens": 15175184} {"current_steps": 11590, "total_steps": 12855, "loss": 1.2083, "accuracy": 0.8999999761581421, "learning_rate": 1.1851818034153833e-06, "epoch": 0.9015947102294827, "percentage": 90.16, "elapsed_time": "5:15:20", "remaining_time": "0:34:25", "throughput": 802.66, "total_tokens": 15186752} {"current_steps": 11600, "total_steps": 12855, "loss": 1.095, "accuracy": 1.0, "learning_rate": 1.1666643629660856e-06, "epoch": 0.9023726176584986, "percentage": 90.24, "elapsed_time": "5:15:31", "remaining_time": "0:34:08", "throughput": 802.73, "total_tokens": 15196896} {"current_steps": 11610, "total_steps": 12855, "loss": 0.7962, "accuracy": 1.0, "learning_rate": 1.1482892668545742e-06, "epoch": 0.9031505250875146, "percentage": 90.32, "elapsed_time": "5:15:48", "remaining_time": "0:33:51", "throughput": 802.71, "total_tokens": 15210464} {"current_steps": 11620, "total_steps": 12855, "loss": 0.8106, "accuracy": 1.0, "learning_rate": 1.1300566248259092e-06, "epoch": 0.9039284325165305, "percentage": 90.39, "elapsed_time": "5:15:57", "remaining_time": "0:33:34", "throughput": 802.84, "total_tokens": 15219536} {"current_steps": 11630, "total_steps": 12855, "loss": 1.8981, "accuracy": 1.0, "learning_rate": 1.1119665457743484e-06, "epoch": 0.9047063399455465, "percentage": 90.47, "elapsed_time": "5:16:07", "remaining_time": "0:33:17", "throughput": 803.03, "total_tokens": 15231792} {"current_steps": 11640, "total_steps": 12855, "loss": 0.7905, "accuracy": 1.0, "learning_rate": 1.0940191377426938e-06, "epoch": 0.9054842473745625, "percentage": 90.55, "elapsed_time": "5:16:19", "remaining_time": "0:33:01", "throughput": 803.09, "total_tokens": 15242496} {"current_steps": 11650, "total_steps": 12855, "loss": 0.917, "accuracy": 1.0, "learning_rate": 1.076214507921644e-06, "epoch": 0.9062621548035784, "percentage": 90.63, "elapsed_time": "5:16:37", "remaining_time": "0:32:45", "throughput": 803.07, "total_tokens": 15256656} {"current_steps": 11660, "total_steps": 12855, "loss": 0.9742, "accuracy": 1.0, "learning_rate": 1.0585527626491564e-06, "epoch": 0.9070400622325944, "percentage": 90.7, "elapsed_time": "5:17:03", "remaining_time": "0:32:29", "throughput": 802.9, "total_tokens": 15273632} {"current_steps": 11670, "total_steps": 12855, "loss": 0.8336, "accuracy": 0.8999999761581421, "learning_rate": 1.0410340074098162e-06, "epoch": 0.9078179696616102, "percentage": 90.78, "elapsed_time": "5:17:15", "remaining_time": "0:32:12", "throughput": 803.0, "total_tokens": 15285872} {"current_steps": 11680, "total_steps": 12855, "loss": 0.9522, "accuracy": 1.0, "learning_rate": 1.0236583468341914e-06, "epoch": 0.9085958770906262, "percentage": 90.86, "elapsed_time": "5:17:30", "remaining_time": "0:31:56", "throughput": 803.03, "total_tokens": 15298096} {"current_steps": 11690, "total_steps": 12855, "loss": 1.1176, "accuracy": 0.8999999761581421, "learning_rate": 1.0064258846982282e-06, "epoch": 0.9093737845196421, "percentage": 90.94, "elapsed_time": "5:17:41", "remaining_time": "0:31:39", "throughput": 803.08, "total_tokens": 15307776} {"current_steps": 11700, "total_steps": 12855, "loss": 0.9805, "accuracy": 0.8999999761581421, "learning_rate": 9.893367239226208e-07, "epoch": 0.9101516919486581, "percentage": 91.02, "elapsed_time": "5:17:54", "remaining_time": "0:31:23", "throughput": 803.18, "total_tokens": 15320480} {"current_steps": 11710, "total_steps": 12855, "loss": 0.6806, "accuracy": 1.0, "learning_rate": 9.723909665721954e-07, "epoch": 0.910929599377674, "percentage": 91.09, "elapsed_time": "5:18:01", "remaining_time": "0:31:05", "throughput": 803.34, "total_tokens": 15329120} {"current_steps": 11720, "total_steps": 12855, "loss": 0.919, "accuracy": 0.8999999761581421, "learning_rate": 9.555887138553015e-07, "epoch": 0.91170750680669, "percentage": 91.17, "elapsed_time": "5:18:15", "remaining_time": "0:30:49", "throughput": 803.41, "total_tokens": 15341536} {"current_steps": 11730, "total_steps": 12855, "loss": 0.7633, "accuracy": 1.0, "learning_rate": 9.389300661232142e-07, "epoch": 0.912485414235706, "percentage": 91.25, "elapsed_time": "5:18:25", "remaining_time": "0:30:32", "throughput": 803.53, "total_tokens": 15351520} {"current_steps": 11740, "total_steps": 12855, "loss": 0.9022, "accuracy": 1.0, "learning_rate": 9.224151228695216e-07, "epoch": 0.9132633216647219, "percentage": 91.33, "elapsed_time": "5:18:59", "remaining_time": "0:30:17", "throughput": 803.1, "total_tokens": 15370992} {"current_steps": 11750, "total_steps": 12855, "loss": 0.8075, "accuracy": 1.0, "learning_rate": 9.060439827295486e-07, "epoch": 0.9140412290937379, "percentage": 91.4, "elapsed_time": "5:19:18", "remaining_time": "0:30:01", "throughput": 803.09, "total_tokens": 15386080} {"current_steps": 11760, "total_steps": 12855, "loss": 1.1229, "accuracy": 1.0, "learning_rate": 8.898167434797433e-07, "epoch": 0.9148191365227538, "percentage": 91.48, "elapsed_time": "5:19:34", "remaining_time": "0:29:45", "throughput": 803.1, "total_tokens": 15399072} {"current_steps": 11770, "total_steps": 12855, "loss": 0.7756, "accuracy": 1.0, "learning_rate": 8.737335020371218e-07, "epoch": 0.9155970439517698, "percentage": 91.56, "elapsed_time": "5:19:48", "remaining_time": "0:29:28", "throughput": 803.18, "total_tokens": 15412064} {"current_steps": 11780, "total_steps": 12855, "loss": 0.9682, "accuracy": 0.8999999761581421, "learning_rate": 8.577943544586686e-07, "epoch": 0.9163749513807857, "percentage": 91.64, "elapsed_time": "5:19:58", "remaining_time": "0:29:11", "throughput": 803.25, "total_tokens": 15420832} {"current_steps": 11790, "total_steps": 12855, "loss": 0.7964, "accuracy": 1.0, "learning_rate": 8.419993959407652e-07, "epoch": 0.9171528588098017, "percentage": 91.72, "elapsed_time": "5:20:15", "remaining_time": "0:28:55", "throughput": 803.19, "total_tokens": 15434000} {"current_steps": 11800, "total_steps": 12855, "loss": 0.7813, "accuracy": 1.0, "learning_rate": 8.263487208186372e-07, "epoch": 0.9179307662388175, "percentage": 91.79, "elapsed_time": "5:20:34", "remaining_time": "0:28:39", "throughput": 803.14, "total_tokens": 15447920} {"current_steps": 11810, "total_steps": 12855, "loss": 0.6235, "accuracy": 1.0, "learning_rate": 8.108424225657635e-07, "epoch": 0.9187086736678335, "percentage": 91.87, "elapsed_time": "5:20:44", "remaining_time": "0:28:22", "throughput": 803.28, "total_tokens": 15458496} {"current_steps": 11820, "total_steps": 12855, "loss": 0.9534, "accuracy": 1.0, "learning_rate": 7.954805937933435e-07, "epoch": 0.9194865810968494, "percentage": 91.95, "elapsed_time": "5:20:59", "remaining_time": "0:28:06", "throughput": 803.34, "total_tokens": 15471504} {"current_steps": 11830, "total_steps": 12855, "loss": 0.8795, "accuracy": 1.0, "learning_rate": 7.802633262497333e-07, "epoch": 0.9202644885258654, "percentage": 92.03, "elapsed_time": "5:21:11", "remaining_time": "0:27:49", "throughput": 803.44, "total_tokens": 15483184} {"current_steps": 11840, "total_steps": 12855, "loss": 1.4278, "accuracy": 0.8999999761581421, "learning_rate": 7.651907108198992e-07, "epoch": 0.9210423959548814, "percentage": 92.1, "elapsed_time": "5:21:23", "remaining_time": "0:27:33", "throughput": 803.55, "total_tokens": 15495376} {"current_steps": 11850, "total_steps": 12855, "loss": 0.9122, "accuracy": 1.0, "learning_rate": 7.502628375248704e-07, "epoch": 0.9218203033838973, "percentage": 92.18, "elapsed_time": "5:21:40", "remaining_time": "0:27:16", "throughput": 803.62, "total_tokens": 15510192} {"current_steps": 11860, "total_steps": 12855, "loss": 0.937, "accuracy": 1.0, "learning_rate": 7.354797955212073e-07, "epoch": 0.9225982108129133, "percentage": 92.26, "elapsed_time": "5:21:55", "remaining_time": "0:27:00", "throughput": 803.63, "total_tokens": 15522240} {"current_steps": 11870, "total_steps": 12855, "loss": 0.9866, "accuracy": 0.8999999761581421, "learning_rate": 7.208416731004724e-07, "epoch": 0.9233761182419292, "percentage": 92.34, "elapsed_time": "5:22:11", "remaining_time": "0:26:44", "throughput": 803.72, "total_tokens": 15537056} {"current_steps": 11880, "total_steps": 12855, "loss": 0.8228, "accuracy": 1.0, "learning_rate": 7.063485576886852e-07, "epoch": 0.9241540256709452, "percentage": 92.42, "elapsed_time": "5:22:22", "remaining_time": "0:26:27", "throughput": 803.83, "total_tokens": 15548384} {"current_steps": 11890, "total_steps": 12855, "loss": 1.116, "accuracy": 1.0, "learning_rate": 6.920005358458243e-07, "epoch": 0.9249319330999611, "percentage": 92.49, "elapsed_time": "5:22:42", "remaining_time": "0:26:11", "throughput": 803.76, "total_tokens": 15562736} {"current_steps": 11900, "total_steps": 12855, "loss": 1.0268, "accuracy": 1.0, "learning_rate": 6.777976932652946e-07, "epoch": 0.9257098405289771, "percentage": 92.57, "elapsed_time": "5:23:01", "remaining_time": "0:25:55", "throughput": 803.8, "total_tokens": 15578576} {"current_steps": 11910, "total_steps": 12855, "loss": 0.9288, "accuracy": 1.0, "learning_rate": 6.637401147734173e-07, "epoch": 0.926487747957993, "percentage": 92.65, "elapsed_time": "5:23:16", "remaining_time": "0:25:38", "throughput": 803.87, "total_tokens": 15592032} {"current_steps": 11920, "total_steps": 12855, "loss": 1.0104, "accuracy": 1.0, "learning_rate": 6.498278843289324e-07, "epoch": 0.9272656553870089, "percentage": 92.73, "elapsed_time": "5:23:31", "remaining_time": "0:25:22", "throughput": 803.87, "total_tokens": 15604512} {"current_steps": 11930, "total_steps": 12855, "loss": 1.1551, "accuracy": 1.0, "learning_rate": 6.360610850224741e-07, "epoch": 0.9280435628160248, "percentage": 92.8, "elapsed_time": "5:23:50", "remaining_time": "0:25:06", "throughput": 803.9, "total_tokens": 15620544} {"current_steps": 11940, "total_steps": 12855, "loss": 0.8369, "accuracy": 1.0, "learning_rate": 6.224397990761105e-07, "epoch": 0.9288214702450408, "percentage": 92.88, "elapsed_time": "5:24:13", "remaining_time": "0:24:50", "throughput": 803.87, "total_tokens": 15638288} {"current_steps": 11950, "total_steps": 12855, "loss": 0.935, "accuracy": 0.8999999761581421, "learning_rate": 6.089641078428188e-07, "epoch": 0.9295993776740568, "percentage": 92.96, "elapsed_time": "5:24:26", "remaining_time": "0:24:34", "throughput": 803.95, "total_tokens": 15650016} {"current_steps": 11960, "total_steps": 12855, "loss": 0.7011, "accuracy": 1.0, "learning_rate": 5.956340918060188e-07, "epoch": 0.9303772851030727, "percentage": 93.04, "elapsed_time": "5:24:44", "remaining_time": "0:24:18", "throughput": 803.96, "total_tokens": 15664480} {"current_steps": 11970, "total_steps": 12855, "loss": 0.9359, "accuracy": 1.0, "learning_rate": 5.824498305790904e-07, "epoch": 0.9311551925320887, "percentage": 93.12, "elapsed_time": "5:25:00", "remaining_time": "0:24:01", "throughput": 803.99, "total_tokens": 15678096} {"current_steps": 11980, "total_steps": 12855, "loss": 0.7642, "accuracy": 0.8999999761581421, "learning_rate": 5.694114029048847e-07, "epoch": 0.9319330999611046, "percentage": 93.19, "elapsed_time": "5:25:09", "remaining_time": "0:23:44", "throughput": 804.09, "total_tokens": 15687184} {"current_steps": 11990, "total_steps": 12855, "loss": 1.1732, "accuracy": 1.0, "learning_rate": 5.565188866552718e-07, "epoch": 0.9327110073901206, "percentage": 93.27, "elapsed_time": "5:25:31", "remaining_time": "0:23:29", "throughput": 804.0, "total_tokens": 15703504} {"current_steps": 12000, "total_steps": 12855, "loss": 1.2573, "accuracy": 0.800000011920929, "learning_rate": 5.437723588306659e-07, "epoch": 0.9334889148191365, "percentage": 93.35, "elapsed_time": "5:25:53", "remaining_time": "0:23:13", "throughput": 803.97, "total_tokens": 15720608} {"current_steps": 12010, "total_steps": 12855, "loss": 0.9168, "accuracy": 0.8999999761581421, "learning_rate": 5.311718955595651e-07, "epoch": 0.9342668222481525, "percentage": 93.43, "elapsed_time": "5:26:14", "remaining_time": "0:22:57", "throughput": 803.84, "total_tokens": 15734576} {"current_steps": 12020, "total_steps": 12855, "loss": 0.6628, "accuracy": 1.0, "learning_rate": 5.187175720980957e-07, "epoch": 0.9350447296771685, "percentage": 93.5, "elapsed_time": "5:26:34", "remaining_time": "0:22:41", "throughput": 803.8, "total_tokens": 15750064} {"current_steps": 12030, "total_steps": 12855, "loss": 1.0443, "accuracy": 1.0, "learning_rate": 5.064094628295741e-07, "epoch": 0.9358226371061844, "percentage": 93.58, "elapsed_time": "5:26:57", "remaining_time": "0:22:25", "throughput": 803.69, "total_tokens": 15765904} {"current_steps": 12040, "total_steps": 12855, "loss": 0.9946, "accuracy": 0.8999999761581421, "learning_rate": 4.942476412640479e-07, "epoch": 0.9366005445352004, "percentage": 93.66, "elapsed_time": "5:27:16", "remaining_time": "0:22:09", "throughput": 803.64, "total_tokens": 15780736} {"current_steps": 12050, "total_steps": 12855, "loss": 0.9204, "accuracy": 1.0, "learning_rate": 4.822321800378643e-07, "epoch": 0.9373784519642162, "percentage": 93.74, "elapsed_time": "5:27:31", "remaining_time": "0:21:52", "throughput": 803.75, "total_tokens": 15794608} {"current_steps": 12060, "total_steps": 12855, "loss": 1.0583, "accuracy": 0.8999999761581421, "learning_rate": 4.7036315091323337e-07, "epoch": 0.9381563593932322, "percentage": 93.82, "elapsed_time": "5:27:44", "remaining_time": "0:21:36", "throughput": 803.82, "total_tokens": 15806912} {"current_steps": 12070, "total_steps": 12855, "loss": 1.5365, "accuracy": 1.0, "learning_rate": 4.586406247778008e-07, "epoch": 0.9389342668222481, "percentage": 93.89, "elapsed_time": "5:28:04", "remaining_time": "0:21:20", "throughput": 803.77, "total_tokens": 15822048} {"current_steps": 12080, "total_steps": 12855, "loss": 0.7322, "accuracy": 0.8999999761581421, "learning_rate": 4.4706467164422894e-07, "epoch": 0.9397121742512641, "percentage": 93.97, "elapsed_time": "5:28:24", "remaining_time": "0:21:04", "throughput": 803.78, "total_tokens": 15838416} {"current_steps": 12090, "total_steps": 12855, "loss": 0.9799, "accuracy": 0.8999999761581421, "learning_rate": 4.356353606497693e-07, "epoch": 0.94049008168028, "percentage": 94.05, "elapsed_time": "5:28:44", "remaining_time": "0:20:48", "throughput": 803.79, "total_tokens": 15854096} {"current_steps": 12100, "total_steps": 12855, "loss": 0.991, "accuracy": 1.0, "learning_rate": 4.2435276005586e-07, "epoch": 0.941267989109296, "percentage": 94.13, "elapsed_time": "5:28:59", "remaining_time": "0:20:31", "throughput": 803.84, "total_tokens": 15867280} {"current_steps": 12110, "total_steps": 12855, "loss": 0.9771, "accuracy": 0.8999999761581421, "learning_rate": 4.132169372477124e-07, "epoch": 0.9420458965383119, "percentage": 94.2, "elapsed_time": "5:29:18", "remaining_time": "0:20:15", "throughput": 803.7, "total_tokens": 15879712} {"current_steps": 12120, "total_steps": 12855, "loss": 0.7652, "accuracy": 0.8999999761581421, "learning_rate": 4.0222795873390283e-07, "epoch": 0.9428238039673279, "percentage": 94.28, "elapsed_time": "5:29:31", "remaining_time": "0:19:59", "throughput": 803.75, "total_tokens": 15891616} {"current_steps": 12130, "total_steps": 12855, "loss": 0.9324, "accuracy": 0.8999999761581421, "learning_rate": 3.9138589014598717e-07, "epoch": 0.9436017113963439, "percentage": 94.36, "elapsed_time": "5:29:46", "remaining_time": "0:19:42", "throughput": 803.79, "total_tokens": 15904240} {"current_steps": 12140, "total_steps": 12855, "loss": 0.9589, "accuracy": 1.0, "learning_rate": 3.806907962381007e-07, "epoch": 0.9443796188253598, "percentage": 94.44, "elapsed_time": "5:29:57", "remaining_time": "0:19:25", "throughput": 803.91, "total_tokens": 15915312} {"current_steps": 12150, "total_steps": 12855, "loss": 0.7232, "accuracy": 1.0, "learning_rate": 3.701427408865782e-07, "epoch": 0.9451575262543758, "percentage": 94.52, "elapsed_time": "5:30:17", "remaining_time": "0:19:09", "throughput": 803.85, "total_tokens": 15929984} {"current_steps": 12160, "total_steps": 12855, "loss": 0.9622, "accuracy": 1.0, "learning_rate": 3.597417870895653e-07, "epoch": 0.9459354336833917, "percentage": 94.59, "elapsed_time": "5:30:35", "remaining_time": "0:18:53", "throughput": 803.89, "total_tokens": 15945424} {"current_steps": 12170, "total_steps": 12855, "loss": 0.9803, "accuracy": 0.8999999761581421, "learning_rate": 3.494879969666437e-07, "epoch": 0.9467133411124076, "percentage": 94.67, "elapsed_time": "5:30:50", "remaining_time": "0:18:37", "throughput": 803.83, "total_tokens": 15956768} {"current_steps": 12180, "total_steps": 12855, "loss": 1.0365, "accuracy": 1.0, "learning_rate": 3.393814317584648e-07, "epoch": 0.9474912485414235, "percentage": 94.75, "elapsed_time": "5:31:04", "remaining_time": "0:18:20", "throughput": 803.92, "total_tokens": 15969616} {"current_steps": 12190, "total_steps": 12855, "loss": 0.841, "accuracy": 1.0, "learning_rate": 3.294221518263779e-07, "epoch": 0.9482691559704395, "percentage": 94.83, "elapsed_time": "5:31:19", "remaining_time": "0:18:04", "throughput": 803.99, "total_tokens": 15983360} {"current_steps": 12200, "total_steps": 12855, "loss": 1.1184, "accuracy": 0.8999999761581421, "learning_rate": 3.196102166520776e-07, "epoch": 0.9490470633994554, "percentage": 94.9, "elapsed_time": "5:31:33", "remaining_time": "0:17:48", "throughput": 804.03, "total_tokens": 15995120} {"current_steps": 12210, "total_steps": 12855, "loss": 0.7673, "accuracy": 1.0, "learning_rate": 3.0994568483723453e-07, "epoch": 0.9498249708284714, "percentage": 94.98, "elapsed_time": "5:31:45", "remaining_time": "0:17:31", "throughput": 804.08, "total_tokens": 16005920} {"current_steps": 12220, "total_steps": 12855, "loss": 0.9459, "accuracy": 0.8999999761581421, "learning_rate": 3.004286141031626e-07, "epoch": 0.9506028782574873, "percentage": 95.06, "elapsed_time": "5:32:01", "remaining_time": "0:17:15", "throughput": 804.13, "total_tokens": 16019360} {"current_steps": 12230, "total_steps": 12855, "loss": 0.834, "accuracy": 0.8999999761581421, "learning_rate": 2.910590612904635e-07, "epoch": 0.9513807856865033, "percentage": 95.14, "elapsed_time": "5:32:12", "remaining_time": "0:16:58", "throughput": 804.18, "total_tokens": 16029104} {"current_steps": 12240, "total_steps": 12855, "loss": 0.9304, "accuracy": 1.0, "learning_rate": 2.81837082358688e-07, "epoch": 0.9521586931155193, "percentage": 95.22, "elapsed_time": "5:32:29", "remaining_time": "0:16:42", "throughput": 804.2, "total_tokens": 16043568} {"current_steps": 12250, "total_steps": 12855, "loss": 0.9775, "accuracy": 0.8999999761581421, "learning_rate": 2.72762732386006e-07, "epoch": 0.9529366005445352, "percentage": 95.29, "elapsed_time": "5:32:45", "remaining_time": "0:16:26", "throughput": 804.26, "total_tokens": 16057312} {"current_steps": 12260, "total_steps": 12855, "loss": 0.8093, "accuracy": 0.800000011920929, "learning_rate": 2.63836065568876e-07, "epoch": 0.9537145079735512, "percentage": 95.37, "elapsed_time": "5:32:59", "remaining_time": "0:16:09", "throughput": 804.23, "total_tokens": 16068064} {"current_steps": 12270, "total_steps": 12855, "loss": 1.0088, "accuracy": 1.0, "learning_rate": 2.5505713522171457e-07, "epoch": 0.9544924154025671, "percentage": 95.45, "elapsed_time": "5:33:15", "remaining_time": "0:15:53", "throughput": 804.17, "total_tokens": 16080032} {"current_steps": 12280, "total_steps": 12855, "loss": 0.9232, "accuracy": 1.0, "learning_rate": 2.464259937765889e-07, "epoch": 0.9552703228315831, "percentage": 95.53, "elapsed_time": "5:33:25", "remaining_time": "0:15:36", "throughput": 804.29, "total_tokens": 16090400} {"current_steps": 12290, "total_steps": 12855, "loss": 0.8555, "accuracy": 1.0, "learning_rate": 2.3794269278289982e-07, "epoch": 0.956048230260599, "percentage": 95.6, "elapsed_time": "5:33:38", "remaining_time": "0:15:20", "throughput": 804.31, "total_tokens": 16101152} {"current_steps": 12300, "total_steps": 12855, "loss": 1.2045, "accuracy": 1.0, "learning_rate": 2.2960728290706836e-07, "epoch": 0.9568261376896149, "percentage": 95.68, "elapsed_time": "5:33:55", "remaining_time": "0:15:04", "throughput": 804.3, "total_tokens": 16114400} {"current_steps": 12310, "total_steps": 12855, "loss": 1.3834, "accuracy": 0.8999999761581421, "learning_rate": 2.2141981393223876e-07, "epoch": 0.9576040451186308, "percentage": 95.76, "elapsed_time": "5:34:06", "remaining_time": "0:14:47", "throughput": 804.38, "total_tokens": 16124784} {"current_steps": 12320, "total_steps": 12855, "loss": 1.0797, "accuracy": 0.8999999761581421, "learning_rate": 2.1338033475798158e-07, "epoch": 0.9583819525476468, "percentage": 95.84, "elapsed_time": "5:34:21", "remaining_time": "0:14:31", "throughput": 804.42, "total_tokens": 16137648} {"current_steps": 12330, "total_steps": 12855, "loss": 0.8836, "accuracy": 1.0, "learning_rate": 2.0548889339999654e-07, "epoch": 0.9591598599766628, "percentage": 95.92, "elapsed_time": "5:34:35", "remaining_time": "0:14:14", "throughput": 804.46, "total_tokens": 16150128} {"current_steps": 12340, "total_steps": 12855, "loss": 0.7582, "accuracy": 1.0, "learning_rate": 1.9774553698983512e-07, "epoch": 0.9599377674056787, "percentage": 95.99, "elapsed_time": "5:34:47", "remaining_time": "0:13:58", "throughput": 804.52, "total_tokens": 16160560} {"current_steps": 12350, "total_steps": 12855, "loss": 0.9609, "accuracy": 1.0, "learning_rate": 1.9015031177460619e-07, "epoch": 0.9607156748346947, "percentage": 96.07, "elapsed_time": "5:35:07", "remaining_time": "0:13:42", "throughput": 804.45, "total_tokens": 16175728} {"current_steps": 12360, "total_steps": 12855, "loss": 0.9568, "accuracy": 0.800000011920929, "learning_rate": 1.827032631167097e-07, "epoch": 0.9614935822637106, "percentage": 96.15, "elapsed_time": "5:35:20", "remaining_time": "0:13:25", "throughput": 804.55, "total_tokens": 16187920} {"current_steps": 12370, "total_steps": 12855, "loss": 0.859, "accuracy": 0.8999999761581421, "learning_rate": 1.7540443549356188e-07, "epoch": 0.9622714896927266, "percentage": 96.23, "elapsed_time": "5:35:38", "remaining_time": "0:13:09", "throughput": 804.52, "total_tokens": 16201888} {"current_steps": 12380, "total_steps": 12855, "loss": 0.7037, "accuracy": 0.8999999761581421, "learning_rate": 1.6825387249733704e-07, "epoch": 0.9630493971217425, "percentage": 96.3, "elapsed_time": "5:35:51", "remaining_time": "0:12:53", "throughput": 804.62, "total_tokens": 16214576} {"current_steps": 12390, "total_steps": 12855, "loss": 1.4037, "accuracy": 1.0, "learning_rate": 1.6125161683468726e-07, "epoch": 0.9638273045507585, "percentage": 96.38, "elapsed_time": "5:36:01", "remaining_time": "0:12:36", "throughput": 804.79, "total_tokens": 16225616} {"current_steps": 12400, "total_steps": 12855, "loss": 0.8089, "accuracy": 0.8999999761581421, "learning_rate": 1.5439771032651485e-07, "epoch": 0.9646052119797744, "percentage": 96.46, "elapsed_time": "5:36:15", "remaining_time": "0:12:20", "throughput": 804.87, "total_tokens": 16238272} {"current_steps": 12410, "total_steps": 12855, "loss": 0.9533, "accuracy": 0.699999988079071, "learning_rate": 1.476921939076975e-07, "epoch": 0.9653831194087904, "percentage": 96.54, "elapsed_time": "5:36:27", "remaining_time": "0:12:03", "throughput": 804.92, "total_tokens": 16249104} {"current_steps": 12420, "total_steps": 12855, "loss": 0.8506, "accuracy": 1.0, "learning_rate": 1.41135107626858e-07, "epoch": 0.9661610268378062, "percentage": 96.62, "elapsed_time": "5:36:38", "remaining_time": "0:11:47", "throughput": 805.0, "total_tokens": 16259392} {"current_steps": 12430, "total_steps": 12855, "loss": 0.8505, "accuracy": 0.800000011920929, "learning_rate": 1.3472649064612818e-07, "epoch": 0.9669389342668222, "percentage": 96.69, "elapsed_time": "5:36:49", "remaining_time": "0:11:30", "throughput": 805.08, "total_tokens": 16270256} {"current_steps": 12440, "total_steps": 12855, "loss": 0.7486, "accuracy": 0.8999999761581421, "learning_rate": 1.2846638124089928e-07, "epoch": 0.9677168416958382, "percentage": 96.77, "elapsed_time": "5:36:59", "remaining_time": "0:11:14", "throughput": 805.15, "total_tokens": 16280016} {"current_steps": 12450, "total_steps": 12855, "loss": 0.9589, "accuracy": 1.0, "learning_rate": 1.2235481679960803e-07, "epoch": 0.9684947491248541, "percentage": 96.85, "elapsed_time": "5:37:16", "remaining_time": "0:10:58", "throughput": 805.22, "total_tokens": 16295184} {"current_steps": 12460, "total_steps": 12855, "loss": 1.1484, "accuracy": 0.8999999761581421, "learning_rate": 1.1639183382350649e-07, "epoch": 0.9692726565538701, "percentage": 96.93, "elapsed_time": "5:37:31", "remaining_time": "0:10:42", "throughput": 805.25, "total_tokens": 16307840} {"current_steps": 12470, "total_steps": 12855, "loss": 0.8724, "accuracy": 0.8999999761581421, "learning_rate": 1.1057746792644541e-07, "epoch": 0.970050563982886, "percentage": 97.01, "elapsed_time": "5:37:40", "remaining_time": "0:10:25", "throughput": 805.46, "total_tokens": 16319312} {"current_steps": 12480, "total_steps": 12855, "loss": 0.9361, "accuracy": 1.0, "learning_rate": 1.0491175383466056e-07, "epoch": 0.970828471411902, "percentage": 97.08, "elapsed_time": "5:37:57", "remaining_time": "0:10:09", "throughput": 805.48, "total_tokens": 16333312} {"current_steps": 12490, "total_steps": 12855, "loss": 0.6204, "accuracy": 1.0, "learning_rate": 9.939472538657013e-08, "epoch": 0.9716063788409179, "percentage": 97.16, "elapsed_time": "5:38:10", "remaining_time": "0:09:52", "throughput": 805.61, "total_tokens": 16346000} {"current_steps": 12500, "total_steps": 12855, "loss": 0.7431, "accuracy": 1.0, "learning_rate": 9.402641553256375e-08, "epoch": 0.9723842862699339, "percentage": 97.24, "elapsed_time": "5:38:18", "remaining_time": "0:09:36", "throughput": 805.71, "total_tokens": 16354496} {"current_steps": 12510, "total_steps": 12855, "loss": 0.895, "accuracy": 1.0, "learning_rate": 8.880685633481656e-08, "epoch": 0.9731621936989499, "percentage": 97.32, "elapsed_time": "5:38:31", "remaining_time": "0:09:20", "throughput": 805.81, "total_tokens": 16367104} {"current_steps": 12520, "total_steps": 12855, "loss": 0.8349, "accuracy": 1.0, "learning_rate": 8.373607896708657e-08, "epoch": 0.9739401011279658, "percentage": 97.39, "elapsed_time": "5:38:44", "remaining_time": "0:09:03", "throughput": 805.88, "total_tokens": 16378816} {"current_steps": 12530, "total_steps": 12855, "loss": 0.9356, "accuracy": 1.0, "learning_rate": 7.881411371453707e-08, "epoch": 0.9747180085569818, "percentage": 97.47, "elapsed_time": "5:38:57", "remaining_time": "0:08:47", "throughput": 805.93, "total_tokens": 16390256} {"current_steps": 12540, "total_steps": 12855, "loss": 0.8335, "accuracy": 1.0, "learning_rate": 7.404098997355335e-08, "epoch": 0.9754959159859977, "percentage": 97.55, "elapsed_time": "5:39:14", "remaining_time": "0:08:31", "throughput": 805.9, "total_tokens": 16403888} {"current_steps": 12550, "total_steps": 12855, "loss": 1.0235, "accuracy": 1.0, "learning_rate": 6.94167362515652e-08, "epoch": 0.9762738234150136, "percentage": 97.63, "elapsed_time": "5:39:43", "remaining_time": "0:08:15", "throughput": 805.56, "total_tokens": 16419856} {"current_steps": 12560, "total_steps": 12855, "loss": 0.6919, "accuracy": 1.0, "learning_rate": 6.494138016687468e-08, "epoch": 0.9770517308440295, "percentage": 97.71, "elapsed_time": "5:40:04", "remaining_time": "0:07:59", "throughput": 805.63, "total_tokens": 16438128} {"current_steps": 12570, "total_steps": 12855, "loss": 0.7878, "accuracy": 0.8999999761581421, "learning_rate": 6.06149484485008e-08, "epoch": 0.9778296382730455, "percentage": 97.78, "elapsed_time": "5:40:17", "remaining_time": "0:07:42", "throughput": 805.66, "total_tokens": 16449392} {"current_steps": 12580, "total_steps": 12855, "loss": 1.1372, "accuracy": 1.0, "learning_rate": 5.643746693600738e-08, "epoch": 0.9786075457020614, "percentage": 97.86, "elapsed_time": "5:40:29", "remaining_time": "0:07:26", "throughput": 805.72, "total_tokens": 16460176} {"current_steps": 12590, "total_steps": 12855, "loss": 0.9705, "accuracy": 0.8999999761581421, "learning_rate": 5.240896057935596e-08, "epoch": 0.9793854531310774, "percentage": 97.94, "elapsed_time": "5:40:46", "remaining_time": "0:07:10", "throughput": 805.74, "total_tokens": 16474832} {"current_steps": 12600, "total_steps": 12855, "loss": 1.1277, "accuracy": 0.8999999761581421, "learning_rate": 4.852945343876147e-08, "epoch": 0.9801633605600933, "percentage": 98.02, "elapsed_time": "5:41:02", "remaining_time": "0:06:54", "throughput": 805.75, "total_tokens": 16487808} {"current_steps": 12610, "total_steps": 12855, "loss": 1.0389, "accuracy": 1.0, "learning_rate": 4.4798968684536816e-08, "epoch": 0.9809412679891093, "percentage": 98.09, "elapsed_time": "5:41:16", "remaining_time": "0:06:37", "throughput": 805.85, "total_tokens": 16500688} {"current_steps": 12620, "total_steps": 12855, "loss": 1.0095, "accuracy": 0.8999999761581421, "learning_rate": 4.12175285969596e-08, "epoch": 0.9817191754181253, "percentage": 98.17, "elapsed_time": "5:41:29", "remaining_time": "0:06:21", "throughput": 805.94, "total_tokens": 16513120} {"current_steps": 12630, "total_steps": 12855, "loss": 0.955, "accuracy": 1.0, "learning_rate": 3.7785154566141734e-08, "epoch": 0.9824970828471412, "percentage": 98.25, "elapsed_time": "5:41:48", "remaining_time": "0:06:05", "throughput": 805.97, "total_tokens": 16529152} {"current_steps": 12640, "total_steps": 12855, "loss": 1.4183, "accuracy": 0.8999999761581421, "learning_rate": 3.450186709190173e-08, "epoch": 0.9832749902761572, "percentage": 98.33, "elapsed_time": "5:42:28", "remaining_time": "0:05:49", "throughput": 805.23, "total_tokens": 16545968} {"current_steps": 12650, "total_steps": 12855, "loss": 0.8927, "accuracy": 1.0, "learning_rate": 3.1367685783637027e-08, "epoch": 0.9840528977051731, "percentage": 98.41, "elapsed_time": "5:42:46", "remaining_time": "0:05:33", "throughput": 805.17, "total_tokens": 16559760} {"current_steps": 12660, "total_steps": 12855, "loss": 0.7103, "accuracy": 1.0, "learning_rate": 2.8382629360212964e-08, "epoch": 0.9848308051341891, "percentage": 98.48, "elapsed_time": "5:43:03", "remaining_time": "0:05:17", "throughput": 805.19, "total_tokens": 16573264} {"current_steps": 12670, "total_steps": 12855, "loss": 0.8865, "accuracy": 0.800000011920929, "learning_rate": 2.5546715649843454e-08, "epoch": 0.9856087125632049, "percentage": 98.56, "elapsed_time": "5:43:15", "remaining_time": "0:05:00", "throughput": 805.22, "total_tokens": 16584240} {"current_steps": 12680, "total_steps": 12855, "loss": 0.9782, "accuracy": 0.8999999761581421, "learning_rate": 2.2859961589996592e-08, "epoch": 0.9863866199922209, "percentage": 98.64, "elapsed_time": "5:43:33", "remaining_time": "0:04:44", "throughput": 805.3, "total_tokens": 16599776} {"current_steps": 12690, "total_steps": 12855, "loss": 0.8853, "accuracy": 1.0, "learning_rate": 2.0322383227278085e-08, "epoch": 0.9871645274212368, "percentage": 98.72, "elapsed_time": "5:43:50", "remaining_time": "0:04:28", "throughput": 805.29, "total_tokens": 16613616} {"current_steps": 12700, "total_steps": 12855, "loss": 0.7783, "accuracy": 1.0, "learning_rate": 1.7933995717347996e-08, "epoch": 0.9879424348502528, "percentage": 98.79, "elapsed_time": "5:44:02", "remaining_time": "0:04:11", "throughput": 805.37, "total_tokens": 16624656} {"current_steps": 12710, "total_steps": 12855, "loss": 0.9228, "accuracy": 1.0, "learning_rate": 1.569481332482636e-08, "epoch": 0.9887203422792687, "percentage": 98.87, "elapsed_time": "5:44:22", "remaining_time": "0:03:55", "throughput": 805.38, "total_tokens": 16641136} {"current_steps": 12720, "total_steps": 12855, "loss": 0.8719, "accuracy": 1.0, "learning_rate": 1.3604849423201616e-08, "epoch": 0.9894982497082847, "percentage": 98.95, "elapsed_time": "5:44:37", "remaining_time": "0:03:39", "throughput": 805.49, "total_tokens": 16655472} {"current_steps": 12730, "total_steps": 12855, "loss": 0.8047, "accuracy": 0.800000011920929, "learning_rate": 1.166411649476673e-08, "epoch": 0.9902761571373007, "percentage": 99.03, "elapsed_time": "5:44:51", "remaining_time": "0:03:23", "throughput": 805.51, "total_tokens": 16666992} {"current_steps": 12740, "total_steps": 12855, "loss": 0.785, "accuracy": 1.0, "learning_rate": 9.87262613052209e-09, "epoch": 0.9910540645663166, "percentage": 99.11, "elapsed_time": "5:45:13", "remaining_time": "0:03:06", "throughput": 805.49, "total_tokens": 16684736} {"current_steps": 12750, "total_steps": 12855, "loss": 0.9037, "accuracy": 1.0, "learning_rate": 8.230389030128293e-09, "epoch": 0.9918319719953326, "percentage": 99.18, "elapsed_time": "5:45:35", "remaining_time": "0:02:50", "throughput": 805.46, "total_tokens": 16701296} {"current_steps": 12760, "total_steps": 12855, "loss": 0.9526, "accuracy": 1.0, "learning_rate": 6.7374150018256754e-09, "epoch": 0.9926098794243485, "percentage": 99.26, "elapsed_time": "5:45:49", "remaining_time": "0:02:34", "throughput": 805.51, "total_tokens": 16713664} {"current_steps": 12770, "total_steps": 12855, "loss": 0.6679, "accuracy": 1.0, "learning_rate": 5.39371296238711e-09, "epoch": 0.9933877868533645, "percentage": 99.34, "elapsed_time": "5:46:09", "remaining_time": "0:02:18", "throughput": 805.41, "total_tokens": 16727856} {"current_steps": 12780, "total_steps": 12855, "loss": 1.2418, "accuracy": 0.800000011920929, "learning_rate": 4.199290937056955e-09, "epoch": 0.9941656942823804, "percentage": 99.42, "elapsed_time": "5:46:27", "remaining_time": "0:02:01", "throughput": 805.33, "total_tokens": 16740848} {"current_steps": 12790, "total_steps": 12855, "loss": 0.9696, "accuracy": 1.0, "learning_rate": 3.154156059512192e-09, "epoch": 0.9949436017113964, "percentage": 99.49, "elapsed_time": "5:46:43", "remaining_time": "0:01:45", "throughput": 805.34, "total_tokens": 16754048} {"current_steps": 12800, "total_steps": 12855, "loss": 0.98, "accuracy": 0.8999999761581421, "learning_rate": 2.258314571804143e-09, "epoch": 0.9957215091404122, "percentage": 99.57, "elapsed_time": "5:47:04", "remaining_time": "0:01:29", "throughput": 805.25, "total_tokens": 16769024} {"current_steps": 12810, "total_steps": 12855, "loss": 0.9398, "accuracy": 1.0, "learning_rate": 1.511771824336261e-09, "epoch": 0.9964994165694282, "percentage": 99.65, "elapsed_time": "5:47:24", "remaining_time": "0:01:13", "throughput": 805.25, "total_tokens": 16784912} {"current_steps": 12820, "total_steps": 12855, "loss": 1.0175, "accuracy": 1.0, "learning_rate": 9.145322758308261e-10, "epoch": 0.9972773239984442, "percentage": 99.73, "elapsed_time": "5:47:42", "remaining_time": "0:00:56", "throughput": 805.26, "total_tokens": 16799360} {"current_steps": 12830, "total_steps": 12855, "loss": 0.8406, "accuracy": 1.0, "learning_rate": 4.665994932956385e-10, "epoch": 0.9980552314274601, "percentage": 99.81, "elapsed_time": "5:48:09", "remaining_time": "0:00:40", "throughput": 805.07, "total_tokens": 16817520} {"current_steps": 12840, "total_steps": 12855, "loss": 1.2627, "accuracy": 0.6000000238418579, "learning_rate": 1.679761519990386e-10, "epoch": 0.9988331388564761, "percentage": 99.88, "elapsed_time": "5:48:24", "remaining_time": "0:00:24", "throughput": 805.11, "total_tokens": 16830640} {"current_steps": 12850, "total_steps": 12855, "loss": 0.758, "accuracy": 1.0, "learning_rate": 1.8664035467130802e-11, "epoch": 0.999611046285492, "percentage": 99.96, "elapsed_time": "5:48:40", "remaining_time": "0:00:08", "throughput": 805.19, "total_tokens": 16844576} {"current_steps": 12855, "total_steps": 12855, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "5:48:46", "remaining_time": "0:00:00", "throughput": 805.11, "total_tokens": 16848032}