{ "best_metric": 0.28454330563545227, "best_model_checkpoint": "joe611/chickens-60-epoch-1000-images-aug/checkpoint-28500", "epoch": 60.0, "eval_steps": 500, "global_step": 30000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.06, "grad_norm": 51.12995529174805, "learning_rate": 9.999975326009292e-06, "loss": 1.7984, "step": 30 }, { "epoch": 0.12, "grad_norm": 264.590087890625, "learning_rate": 9.999901304280686e-06, "loss": 1.9316, "step": 60 }, { "epoch": 0.18, "grad_norm": 74.54895782470703, "learning_rate": 9.99977793554475e-06, "loss": 1.5595, "step": 90 }, { "epoch": 0.24, "grad_norm": 182.5364532470703, "learning_rate": 9.999605221019082e-06, "loss": 1.5981, "step": 120 }, { "epoch": 0.3, "grad_norm": 90.40423583984375, "learning_rate": 9.999383162408303e-06, "loss": 1.5708, "step": 150 }, { "epoch": 0.36, "grad_norm": 84.81971740722656, "learning_rate": 9.999111761904046e-06, "loss": 1.5353, "step": 180 }, { "epoch": 0.42, "grad_norm": 66.83992767333984, "learning_rate": 9.998791022184921e-06, "loss": 1.5156, "step": 210 }, { "epoch": 0.48, "grad_norm": 46.15699768066406, "learning_rate": 9.9984209464165e-06, "loss": 1.5476, "step": 240 }, { "epoch": 0.54, "grad_norm": 374.46685791015625, "learning_rate": 9.998001538251283e-06, "loss": 1.4349, "step": 270 }, { "epoch": 0.6, "grad_norm": 34.38185119628906, "learning_rate": 9.997532801828659e-06, "loss": 1.4334, "step": 300 }, { "epoch": 0.66, "grad_norm": 57.43722152709961, "learning_rate": 9.997014741774866e-06, "loss": 1.4666, "step": 330 }, { "epoch": 0.72, "grad_norm": 114.363525390625, "learning_rate": 9.996447363202947e-06, "loss": 1.2964, "step": 360 }, { "epoch": 0.78, "grad_norm": 74.82312774658203, "learning_rate": 9.995830671712701e-06, "loss": 1.307, "step": 390 }, { "epoch": 0.84, "grad_norm": 87.48751068115234, "learning_rate": 9.995164673390624e-06, "loss": 1.2696, "step": 420 }, { "epoch": 0.9, "grad_norm": 50.108421325683594, "learning_rate": 9.994449374809851e-06, "loss": 1.1757, "step": 450 }, { "epoch": 0.96, "grad_norm": 63.529415130615234, "learning_rate": 9.99368478303009e-06, "loss": 1.4811, "step": 480 }, { "epoch": 1.0, "eval_loss": 1.3713055849075317, "eval_map": 0.0772, "eval_map_50": 0.1135, "eval_map_75": 0.0875, "eval_map_chicken": 0.0069, "eval_map_duck": 0.0, "eval_map_large": 0.3534, "eval_map_medium": 0.0389, "eval_map_plant": 0.2247, "eval_map_small": 0.004, "eval_mar_1": 0.0527, "eval_mar_10": 0.1857, "eval_mar_100": 0.2513, "eval_mar_100_chicken": 0.0062, "eval_mar_100_duck": 0.0, "eval_mar_100_plant": 0.7476, "eval_mar_large": 0.7937, "eval_mar_medium": 0.2276, "eval_mar_small": 0.0875, "eval_runtime": 5.1266, "eval_samples_per_second": 19.506, "eval_steps_per_second": 2.536, "step": 500 }, { "epoch": 1.02, "grad_norm": 48.37826156616211, "learning_rate": 9.992870905597549e-06, "loss": 1.2844, "step": 510 }, { "epoch": 1.08, "grad_norm": 52.364105224609375, "learning_rate": 9.992007750544876e-06, "loss": 1.291, "step": 540 }, { "epoch": 1.1400000000000001, "grad_norm": 121.01571655273438, "learning_rate": 9.991095326391061e-06, "loss": 1.1206, "step": 570 }, { "epoch": 1.2, "grad_norm": 57.15728759765625, "learning_rate": 9.990133642141359e-06, "loss": 1.3043, "step": 600 }, { "epoch": 1.26, "grad_norm": 142.0693817138672, "learning_rate": 9.98912270728721e-06, "loss": 1.3167, "step": 630 }, { "epoch": 1.32, "grad_norm": 141.81764221191406, "learning_rate": 9.988062531806127e-06, "loss": 1.295, "step": 660 }, { "epoch": 1.38, "grad_norm": 78.71722412109375, "learning_rate": 9.98695312616162e-06, "loss": 1.3064, "step": 690 }, { "epoch": 1.44, "grad_norm": 67.82110595703125, "learning_rate": 9.98579450130307e-06, "loss": 1.0711, "step": 720 }, { "epoch": 1.5, "grad_norm": 125.79237365722656, "learning_rate": 9.984586668665641e-06, "loss": 1.1637, "step": 750 }, { "epoch": 1.56, "grad_norm": 66.8957748413086, "learning_rate": 9.98332964017015e-06, "loss": 1.1349, "step": 780 }, { "epoch": 1.62, "grad_norm": 77.45892333984375, "learning_rate": 9.982023428222963e-06, "loss": 1.0902, "step": 810 }, { "epoch": 1.6800000000000002, "grad_norm": 77.51893615722656, "learning_rate": 9.980668045715864e-06, "loss": 1.2707, "step": 840 }, { "epoch": 1.74, "grad_norm": 52.3269157409668, "learning_rate": 9.97926350602593e-06, "loss": 1.1578, "step": 870 }, { "epoch": 1.8, "grad_norm": 50.24958419799805, "learning_rate": 9.9778098230154e-06, "loss": 1.1071, "step": 900 }, { "epoch": 1.8599999999999999, "grad_norm": 90.0967788696289, "learning_rate": 9.976307011031542e-06, "loss": 1.251, "step": 930 }, { "epoch": 1.92, "grad_norm": 174.36660766601562, "learning_rate": 9.974755084906503e-06, "loss": 1.05, "step": 960 }, { "epoch": 1.98, "grad_norm": 78.29364013671875, "learning_rate": 9.973154059957162e-06, "loss": 1.093, "step": 990 }, { "epoch": 2.0, "eval_loss": 1.1410857439041138, "eval_map": 0.1941, "eval_map_50": 0.2637, "eval_map_75": 0.221, "eval_map_chicken": 0.0, "eval_map_duck": 0.0, "eval_map_large": 0.6715, "eval_map_medium": 0.134, "eval_map_plant": 0.5822, "eval_map_small": 0.0042, "eval_mar_1": 0.0688, "eval_mar_10": 0.2331, "eval_mar_100": 0.2586, "eval_mar_100_chicken": 0.0, "eval_mar_100_duck": 0.0, "eval_mar_100_plant": 0.7758, "eval_mar_large": 0.8259, "eval_mar_medium": 0.23, "eval_mar_small": 0.1167, "eval_runtime": 4.9547, "eval_samples_per_second": 20.183, "eval_steps_per_second": 2.624, "step": 1000 }, { "epoch": 2.04, "grad_norm": 69.85189056396484, "learning_rate": 9.971503951984996e-06, "loss": 1.1616, "step": 1020 }, { "epoch": 2.1, "grad_norm": 37.134403228759766, "learning_rate": 9.9698047772759e-06, "loss": 1.0393, "step": 1050 }, { "epoch": 2.16, "grad_norm": 52.74504852294922, "learning_rate": 9.968056552600043e-06, "loss": 1.1147, "step": 1080 }, { "epoch": 2.22, "grad_norm": 70.72219848632812, "learning_rate": 9.966259295211698e-06, "loss": 1.0797, "step": 1110 }, { "epoch": 2.2800000000000002, "grad_norm": 104.32415771484375, "learning_rate": 9.964413022849069e-06, "loss": 0.9984, "step": 1140 }, { "epoch": 2.34, "grad_norm": 65.52819061279297, "learning_rate": 9.96251775373412e-06, "loss": 1.036, "step": 1170 }, { "epoch": 2.4, "grad_norm": 43.15259552001953, "learning_rate": 9.960573506572391e-06, "loss": 1.3154, "step": 1200 }, { "epoch": 2.46, "grad_norm": 76.51600646972656, "learning_rate": 9.958580300552816e-06, "loss": 1.1412, "step": 1230 }, { "epoch": 2.52, "grad_norm": 0.6177086234092712, "learning_rate": 9.956538155347534e-06, "loss": 1.2674, "step": 1260 }, { "epoch": 2.58, "grad_norm": 53.222103118896484, "learning_rate": 9.954447091111695e-06, "loss": 1.1138, "step": 1290 }, { "epoch": 2.64, "grad_norm": 94.70368194580078, "learning_rate": 9.952307128483257e-06, "loss": 1.0613, "step": 1320 }, { "epoch": 2.7, "grad_norm": 89.58301544189453, "learning_rate": 9.95011828858279e-06, "loss": 1.0912, "step": 1350 }, { "epoch": 2.76, "grad_norm": 43.07695388793945, "learning_rate": 9.947880593013256e-06, "loss": 1.1115, "step": 1380 }, { "epoch": 2.82, "grad_norm": 52.474220275878906, "learning_rate": 9.94559406385981e-06, "loss": 0.9757, "step": 1410 }, { "epoch": 2.88, "grad_norm": 46.698448181152344, "learning_rate": 9.94325872368957e-06, "loss": 1.1364, "step": 1440 }, { "epoch": 2.94, "grad_norm": 49.13819885253906, "learning_rate": 9.940874595551403e-06, "loss": 0.9772, "step": 1470 }, { "epoch": 3.0, "grad_norm": 101.07115173339844, "learning_rate": 9.938441702975689e-06, "loss": 1.06, "step": 1500 }, { "epoch": 3.0, "eval_loss": 1.5299323797225952, "eval_map": 0.1865, "eval_map_50": 0.2571, "eval_map_75": 0.2063, "eval_map_chicken": 0.0, "eval_map_duck": 0.0, "eval_map_large": 0.6155, "eval_map_medium": 0.1497, "eval_map_plant": 0.5595, "eval_map_small": 0.0172, "eval_mar_1": 0.0695, "eval_mar_10": 0.2154, "eval_mar_100": 0.2187, "eval_mar_100_chicken": 0.0, "eval_mar_100_duck": 0.0, "eval_mar_100_plant": 0.6562, "eval_mar_large": 0.6971, "eval_mar_medium": 0.199, "eval_mar_small": 0.0583, "eval_runtime": 4.9962, "eval_samples_per_second": 20.015, "eval_steps_per_second": 2.602, "step": 1500 }, { "epoch": 3.06, "grad_norm": 96.25062561035156, "learning_rate": 9.935960069974096e-06, "loss": 1.2809, "step": 1530 }, { "epoch": 3.12, "grad_norm": 90.79141235351562, "learning_rate": 9.93342972103934e-06, "loss": 0.9711, "step": 1560 }, { "epoch": 3.18, "grad_norm": 87.00637817382812, "learning_rate": 9.930850681144946e-06, "loss": 1.0352, "step": 1590 }, { "epoch": 3.24, "grad_norm": 64.22712707519531, "learning_rate": 9.928222975744992e-06, "loss": 1.0759, "step": 1620 }, { "epoch": 3.3, "grad_norm": 38.713409423828125, "learning_rate": 9.92554663077387e-06, "loss": 1.2278, "step": 1650 }, { "epoch": 3.36, "grad_norm": 346.5014343261719, "learning_rate": 9.922821672646028e-06, "loss": 0.8572, "step": 1680 }, { "epoch": 3.42, "grad_norm": 42.0444450378418, "learning_rate": 9.920048128255699e-06, "loss": 0.9703, "step": 1710 }, { "epoch": 3.48, "grad_norm": 43.47895431518555, "learning_rate": 9.91722602497665e-06, "loss": 1.0172, "step": 1740 }, { "epoch": 3.54, "grad_norm": 47.463985443115234, "learning_rate": 9.914355390661897e-06, "loss": 1.0251, "step": 1770 }, { "epoch": 3.6, "grad_norm": 98.45388793945312, "learning_rate": 9.911436253643445e-06, "loss": 0.8112, "step": 1800 }, { "epoch": 3.66, "grad_norm": 47.29812240600586, "learning_rate": 9.908468642731996e-06, "loss": 1.0115, "step": 1830 }, { "epoch": 3.7199999999999998, "grad_norm": 65.47380065917969, "learning_rate": 9.90545258721667e-06, "loss": 1.1073, "step": 1860 }, { "epoch": 3.7800000000000002, "grad_norm": 36.47480010986328, "learning_rate": 9.902388116864723e-06, "loss": 1.1526, "step": 1890 }, { "epoch": 3.84, "grad_norm": 70.70551300048828, "learning_rate": 9.899275261921236e-06, "loss": 0.8749, "step": 1920 }, { "epoch": 3.9, "grad_norm": 41.91495132446289, "learning_rate": 9.89611405310883e-06, "loss": 0.8569, "step": 1950 }, { "epoch": 3.96, "grad_norm": 61.9908561706543, "learning_rate": 9.89290452162736e-06, "loss": 0.866, "step": 1980 }, { "epoch": 4.0, "eval_loss": 1.0132447481155396, "eval_map": 0.2298, "eval_map_50": 0.307, "eval_map_75": 0.2534, "eval_map_chicken": 0.0329, "eval_map_duck": 0.0, "eval_map_large": 0.7269, "eval_map_medium": 0.1936, "eval_map_plant": 0.6564, "eval_map_small": 0.0251, "eval_mar_1": 0.0897, "eval_mar_10": 0.2671, "eval_mar_100": 0.2739, "eval_mar_100_chicken": 0.0613, "eval_mar_100_duck": 0.0, "eval_mar_100_plant": 0.7602, "eval_mar_large": 0.8172, "eval_mar_medium": 0.2449, "eval_mar_small": 0.0688, "eval_runtime": 5.0087, "eval_samples_per_second": 19.965, "eval_steps_per_second": 2.595, "step": 2000 }, { "epoch": 4.02, "grad_norm": 65.72293853759766, "learning_rate": 9.88964669915361e-06, "loss": 1.0872, "step": 2010 }, { "epoch": 4.08, "grad_norm": 126.20653533935547, "learning_rate": 9.886340617840968e-06, "loss": 1.0516, "step": 2040 }, { "epoch": 4.14, "grad_norm": 62.30933380126953, "learning_rate": 9.882986310319124e-06, "loss": 0.993, "step": 2070 }, { "epoch": 4.2, "grad_norm": 62.221160888671875, "learning_rate": 9.879583809693737e-06, "loss": 1.0601, "step": 2100 }, { "epoch": 4.26, "grad_norm": 55.73953628540039, "learning_rate": 9.876133149546117e-06, "loss": 0.7821, "step": 2130 }, { "epoch": 4.32, "grad_norm": 57.795196533203125, "learning_rate": 9.872634363932887e-06, "loss": 0.9674, "step": 2160 }, { "epoch": 4.38, "grad_norm": 49.45548629760742, "learning_rate": 9.869087487385644e-06, "loss": 0.8739, "step": 2190 }, { "epoch": 4.44, "grad_norm": 55.93813705444336, "learning_rate": 9.865492554910634e-06, "loss": 0.9908, "step": 2220 }, { "epoch": 4.5, "grad_norm": 55.131141662597656, "learning_rate": 9.861849601988384e-06, "loss": 0.9069, "step": 2250 }, { "epoch": 4.5600000000000005, "grad_norm": 45.55573272705078, "learning_rate": 9.85815866457337e-06, "loss": 0.9796, "step": 2280 }, { "epoch": 4.62, "grad_norm": 41.95097732543945, "learning_rate": 9.854419779093656e-06, "loss": 0.8175, "step": 2310 }, { "epoch": 4.68, "grad_norm": 480.2862243652344, "learning_rate": 9.85063298245053e-06, "loss": 0.8588, "step": 2340 }, { "epoch": 4.74, "grad_norm": 51.55152893066406, "learning_rate": 9.846798312018147e-06, "loss": 0.9936, "step": 2370 }, { "epoch": 4.8, "grad_norm": 36.979496002197266, "learning_rate": 9.842915805643156e-06, "loss": 0.9615, "step": 2400 }, { "epoch": 4.86, "grad_norm": 47.84645462036133, "learning_rate": 9.838985501644329e-06, "loss": 0.8042, "step": 2430 }, { "epoch": 4.92, "grad_norm": 40.069725036621094, "learning_rate": 9.835007438812177e-06, "loss": 0.9539, "step": 2460 }, { "epoch": 4.98, "grad_norm": 86.61743927001953, "learning_rate": 9.830981656408575e-06, "loss": 0.8301, "step": 2490 }, { "epoch": 5.0, "eval_loss": 0.9037431478500366, "eval_map": 0.2895, "eval_map_50": 0.3972, "eval_map_75": 0.3375, "eval_map_chicken": 0.2025, "eval_map_duck": 0.0, "eval_map_large": 0.7397, "eval_map_medium": 0.25, "eval_map_plant": 0.6662, "eval_map_small": 0.0486, "eval_mar_1": 0.1158, "eval_mar_10": 0.3495, "eval_mar_100": 0.3568, "eval_mar_100_chicken": 0.3062, "eval_mar_100_duck": 0.0, "eval_mar_100_plant": 0.7643, "eval_mar_large": 0.8305, "eval_mar_medium": 0.3238, "eval_mar_small": 0.1063, "eval_runtime": 4.9996, "eval_samples_per_second": 20.002, "eval_steps_per_second": 2.6, "step": 2500 }, { "epoch": 5.04, "grad_norm": 69.0333251953125, "learning_rate": 9.82690819416637e-06, "loss": 0.933, "step": 2520 }, { "epoch": 5.1, "grad_norm": 38.97633743286133, "learning_rate": 9.822787092288991e-06, "loss": 1.0335, "step": 2550 }, { "epoch": 5.16, "grad_norm": 52.52025604248047, "learning_rate": 9.81861839145005e-06, "loss": 0.9546, "step": 2580 }, { "epoch": 5.22, "grad_norm": 68.2970962524414, "learning_rate": 9.814402132792939e-06, "loss": 0.8876, "step": 2610 }, { "epoch": 5.28, "grad_norm": 89.29615783691406, "learning_rate": 9.81013835793043e-06, "loss": 0.9496, "step": 2640 }, { "epoch": 5.34, "grad_norm": 50.56565475463867, "learning_rate": 9.80582710894426e-06, "loss": 0.7895, "step": 2670 }, { "epoch": 5.4, "grad_norm": 33.971832275390625, "learning_rate": 9.801468428384716e-06, "loss": 0.9679, "step": 2700 }, { "epoch": 5.46, "grad_norm": 45.445594787597656, "learning_rate": 9.797062359270215e-06, "loss": 0.924, "step": 2730 }, { "epoch": 5.52, "grad_norm": 45.259674072265625, "learning_rate": 9.79260894508688e-06, "loss": 0.9305, "step": 2760 }, { "epoch": 5.58, "grad_norm": 42.04433059692383, "learning_rate": 9.788108229788111e-06, "loss": 0.9169, "step": 2790 }, { "epoch": 5.64, "grad_norm": 109.8760986328125, "learning_rate": 9.783560257794153e-06, "loss": 1.2765, "step": 2820 }, { "epoch": 5.7, "grad_norm": 63.83809280395508, "learning_rate": 9.778965073991652e-06, "loss": 1.2013, "step": 2850 }, { "epoch": 5.76, "grad_norm": 205.1379852294922, "learning_rate": 9.774322723733216e-06, "loss": 0.9418, "step": 2880 }, { "epoch": 5.82, "grad_norm": 23.930816650390625, "learning_rate": 9.769633252836969e-06, "loss": 0.8923, "step": 2910 }, { "epoch": 5.88, "grad_norm": 39.413909912109375, "learning_rate": 9.764896707586095e-06, "loss": 0.8823, "step": 2940 }, { "epoch": 5.9399999999999995, "grad_norm": 111.26641845703125, "learning_rate": 9.760113134728383e-06, "loss": 0.9271, "step": 2970 }, { "epoch": 6.0, "grad_norm": 83.30919647216797, "learning_rate": 9.755282581475769e-06, "loss": 0.8386, "step": 3000 }, { "epoch": 6.0, "eval_loss": 0.9659404158592224, "eval_map": 0.3229, "eval_map_50": 0.4625, "eval_map_75": 0.3953, "eval_map_chicken": 0.3161, "eval_map_duck": 0.0, "eval_map_large": 0.7146, "eval_map_medium": 0.2944, "eval_map_plant": 0.6527, "eval_map_small": 0.012, "eval_mar_1": 0.1161, "eval_mar_10": 0.3938, "eval_mar_100": 0.3977, "eval_mar_100_chicken": 0.4693, "eval_mar_100_duck": 0.0, "eval_mar_100_plant": 0.7236, "eval_mar_large": 0.7837, "eval_mar_medium": 0.3785, "eval_mar_small": 0.0333, "eval_runtime": 4.9283, "eval_samples_per_second": 20.291, "eval_steps_per_second": 2.638, "step": 3000 }, { "epoch": 6.06, "grad_norm": 34.77956008911133, "learning_rate": 9.750405095503859e-06, "loss": 0.9097, "step": 3030 }, { "epoch": 6.12, "grad_norm": 41.7236328125, "learning_rate": 9.745480724951473e-06, "loss": 0.7642, "step": 3060 }, { "epoch": 6.18, "grad_norm": 21.034090042114258, "learning_rate": 9.74050951842016e-06, "loss": 0.8596, "step": 3090 }, { "epoch": 6.24, "grad_norm": 36.62574005126953, "learning_rate": 9.735491524973723e-06, "loss": 0.8173, "step": 3120 }, { "epoch": 6.3, "grad_norm": 89.44732666015625, "learning_rate": 9.730426794137727e-06, "loss": 0.856, "step": 3150 }, { "epoch": 6.36, "grad_norm": 56.18183898925781, "learning_rate": 9.725315375899025e-06, "loss": 0.8138, "step": 3180 }, { "epoch": 6.42, "grad_norm": 41.0568962097168, "learning_rate": 9.72015732070525e-06, "loss": 0.8276, "step": 3210 }, { "epoch": 6.48, "grad_norm": 76.43619537353516, "learning_rate": 9.714952679464324e-06, "loss": 0.8188, "step": 3240 }, { "epoch": 6.54, "grad_norm": 39.30849075317383, "learning_rate": 9.709701503543954e-06, "loss": 0.7778, "step": 3270 }, { "epoch": 6.6, "grad_norm": 71.78713989257812, "learning_rate": 9.704403844771128e-06, "loss": 0.8526, "step": 3300 }, { "epoch": 6.66, "grad_norm": 68.13652038574219, "learning_rate": 9.699059755431599e-06, "loss": 0.871, "step": 3330 }, { "epoch": 6.72, "grad_norm": 158.08872985839844, "learning_rate": 9.693669288269371e-06, "loss": 1.1321, "step": 3360 }, { "epoch": 6.78, "grad_norm": 34.7762451171875, "learning_rate": 9.688232496486179e-06, "loss": 0.8604, "step": 3390 }, { "epoch": 6.84, "grad_norm": 42.608489990234375, "learning_rate": 9.682749433740963e-06, "loss": 0.9493, "step": 3420 }, { "epoch": 6.9, "grad_norm": 0.026101410388946533, "learning_rate": 9.677220154149338e-06, "loss": 0.7639, "step": 3450 }, { "epoch": 6.96, "grad_norm": 147.83847045898438, "learning_rate": 9.671644712283061e-06, "loss": 0.9838, "step": 3480 }, { "epoch": 7.0, "eval_loss": 0.7706183791160583, "eval_map": 0.3831, "eval_map_50": 0.5318, "eval_map_75": 0.4649, "eval_map_chicken": 0.4609, "eval_map_duck": 0.0, "eval_map_large": 0.7573, "eval_map_medium": 0.3525, "eval_map_plant": 0.6886, "eval_map_small": 0.0314, "eval_mar_1": 0.1347, "eval_mar_10": 0.4783, "eval_mar_100": 0.4829, "eval_mar_100_chicken": 0.6889, "eval_mar_100_duck": 0.0, "eval_mar_100_plant": 0.7599, "eval_mar_large": 0.8234, "eval_mar_medium": 0.4636, "eval_mar_small": 0.0854, "eval_runtime": 5.0062, "eval_samples_per_second": 19.975, "eval_steps_per_second": 2.597, "step": 3500 }, { "epoch": 7.02, "grad_norm": 55.403541564941406, "learning_rate": 9.666023163169493e-06, "loss": 0.8917, "step": 3510 }, { "epoch": 7.08, "grad_norm": 189.77401733398438, "learning_rate": 9.660355562291055e-06, "loss": 0.858, "step": 3540 }, { "epoch": 7.14, "grad_norm": 58.92485427856445, "learning_rate": 9.65464196558468e-06, "loss": 0.7254, "step": 3570 }, { "epoch": 7.2, "grad_norm": 46.30803298950195, "learning_rate": 9.648882429441258e-06, "loss": 0.7928, "step": 3600 }, { "epoch": 7.26, "grad_norm": 111.99207305908203, "learning_rate": 9.643077010705088e-06, "loss": 0.7594, "step": 3630 }, { "epoch": 7.32, "grad_norm": 72.06273651123047, "learning_rate": 9.637225766673309e-06, "loss": 0.8397, "step": 3660 }, { "epoch": 7.38, "grad_norm": 35.78024673461914, "learning_rate": 9.631328755095334e-06, "loss": 0.8906, "step": 3690 }, { "epoch": 7.44, "grad_norm": 140.4214630126953, "learning_rate": 9.62538603417229e-06, "loss": 0.6961, "step": 3720 }, { "epoch": 7.5, "grad_norm": 55.60920715332031, "learning_rate": 9.619397662556434e-06, "loss": 0.7646, "step": 3750 }, { "epoch": 7.5600000000000005, "grad_norm": 43.936187744140625, "learning_rate": 9.613363699350575e-06, "loss": 0.8446, "step": 3780 }, { "epoch": 7.62, "grad_norm": 61.2660026550293, "learning_rate": 9.607284204107493e-06, "loss": 0.7357, "step": 3810 }, { "epoch": 7.68, "grad_norm": 55.53911209106445, "learning_rate": 9.601159236829353e-06, "loss": 0.7807, "step": 3840 }, { "epoch": 7.74, "grad_norm": 86.03663635253906, "learning_rate": 9.594988857967107e-06, "loss": 0.9694, "step": 3870 }, { "epoch": 7.8, "grad_norm": 37.17007064819336, "learning_rate": 9.588773128419907e-06, "loss": 0.754, "step": 3900 }, { "epoch": 7.86, "grad_norm": 47.19321060180664, "learning_rate": 9.58251210953449e-06, "loss": 1.0753, "step": 3930 }, { "epoch": 7.92, "grad_norm": 51.06205368041992, "learning_rate": 9.576205863104588e-06, "loss": 0.8297, "step": 3960 }, { "epoch": 7.98, "grad_norm": 60.964874267578125, "learning_rate": 9.569854451370306e-06, "loss": 0.8051, "step": 3990 }, { "epoch": 8.0, "eval_loss": 0.7423961758613586, "eval_map": 0.3909, "eval_map_50": 0.5361, "eval_map_75": 0.4744, "eval_map_chicken": 0.4864, "eval_map_duck": 0.0, "eval_map_large": 0.7506, "eval_map_medium": 0.362, "eval_map_plant": 0.6864, "eval_map_small": 0.0298, "eval_mar_1": 0.1396, "eval_mar_10": 0.489, "eval_mar_100": 0.4921, "eval_mar_100_chicken": 0.712, "eval_mar_100_duck": 0.0, "eval_mar_100_plant": 0.7643, "eval_mar_large": 0.8222, "eval_mar_medium": 0.4762, "eval_mar_small": 0.1063, "eval_runtime": 5.1458, "eval_samples_per_second": 19.433, "eval_steps_per_second": 2.526, "step": 4000 }, { "epoch": 8.04, "grad_norm": 34.82122802734375, "learning_rate": 9.563457937017514e-06, "loss": 0.8709, "step": 4020 }, { "epoch": 8.1, "grad_norm": 97.54671478271484, "learning_rate": 9.557016383177226e-06, "loss": 0.9338, "step": 4050 }, { "epoch": 8.16, "grad_norm": 38.53603744506836, "learning_rate": 9.550529853424979e-06, "loss": 0.8831, "step": 4080 }, { "epoch": 8.22, "grad_norm": 55.73428726196289, "learning_rate": 9.543998411780202e-06, "loss": 0.7674, "step": 4110 }, { "epoch": 8.28, "grad_norm": 29.146512985229492, "learning_rate": 9.537422122705585e-06, "loss": 1.1078, "step": 4140 }, { "epoch": 8.34, "grad_norm": 119.19530487060547, "learning_rate": 9.530801051106449e-06, "loss": 0.6341, "step": 4170 }, { "epoch": 8.4, "grad_norm": 66.55436706542969, "learning_rate": 9.524135262330098e-06, "loss": 0.7727, "step": 4200 }, { "epoch": 8.46, "grad_norm": 108.39798736572266, "learning_rate": 9.517424822165175e-06, "loss": 0.8202, "step": 4230 }, { "epoch": 8.52, "grad_norm": 47.83013916015625, "learning_rate": 9.510669796841014e-06, "loss": 0.9373, "step": 4260 }, { "epoch": 8.58, "grad_norm": 57.3923225402832, "learning_rate": 9.503870253026992e-06, "loss": 0.6963, "step": 4290 }, { "epoch": 8.64, "grad_norm": 47.453041076660156, "learning_rate": 9.497026257831856e-06, "loss": 0.7835, "step": 4320 }, { "epoch": 8.7, "grad_norm": 50.4648551940918, "learning_rate": 9.490137878803078e-06, "loss": 0.6982, "step": 4350 }, { "epoch": 8.76, "grad_norm": 67.14995574951172, "learning_rate": 9.48320518392618e-06, "loss": 0.8588, "step": 4380 }, { "epoch": 8.82, "grad_norm": 61.14694595336914, "learning_rate": 9.476228241624059e-06, "loss": 0.7882, "step": 4410 }, { "epoch": 8.88, "grad_norm": 26.730520248413086, "learning_rate": 9.46920712075632e-06, "loss": 0.8078, "step": 4440 }, { "epoch": 8.94, "grad_norm": 66.36459350585938, "learning_rate": 9.46214189061859e-06, "loss": 0.7777, "step": 4470 }, { "epoch": 9.0, "grad_norm": 0.00832737423479557, "learning_rate": 9.45503262094184e-06, "loss": 0.7114, "step": 4500 }, { "epoch": 9.0, "eval_loss": 0.6859935522079468, "eval_map": 0.425, "eval_map_50": 0.5595, "eval_map_75": 0.5062, "eval_map_chicken": 0.5552, "eval_map_duck": 0.0, "eval_map_large": 0.7822, "eval_map_medium": 0.4023, "eval_map_plant": 0.7197, "eval_map_small": 0.0656, "eval_mar_1": 0.1429, "eval_mar_10": 0.5123, "eval_mar_100": 0.5168, "eval_mar_100_chicken": 0.7609, "eval_mar_100_duck": 0.0, "eval_mar_100_plant": 0.7896, "eval_mar_large": 0.849, "eval_mar_medium": 0.5014, "eval_mar_small": 0.1104, "eval_runtime": 4.9198, "eval_samples_per_second": 20.326, "eval_steps_per_second": 2.642, "step": 4500 }, { "epoch": 9.06, "grad_norm": 41.9913215637207, "learning_rate": 9.447879381891691e-06, "loss": 0.742, "step": 4530 }, { "epoch": 9.12, "grad_norm": 118.60945892333984, "learning_rate": 9.440682244067724e-06, "loss": 0.7156, "step": 4560 }, { "epoch": 9.18, "grad_norm": 46.92107009887695, "learning_rate": 9.433441278502784e-06, "loss": 0.7649, "step": 4590 }, { "epoch": 9.24, "grad_norm": 47.721012115478516, "learning_rate": 9.426156556662276e-06, "loss": 0.7351, "step": 4620 }, { "epoch": 9.3, "grad_norm": 32.733455657958984, "learning_rate": 9.418828150443469e-06, "loss": 0.7486, "step": 4650 }, { "epoch": 9.36, "grad_norm": 96.80855560302734, "learning_rate": 9.411456132174768e-06, "loss": 0.7729, "step": 4680 }, { "epoch": 9.42, "grad_norm": 37.33518981933594, "learning_rate": 9.404040574615018e-06, "loss": 0.7362, "step": 4710 }, { "epoch": 9.48, "grad_norm": 43.71377182006836, "learning_rate": 9.396581550952781e-06, "loss": 0.6084, "step": 4740 }, { "epoch": 9.54, "grad_norm": 98.9687728881836, "learning_rate": 9.38907913480561e-06, "loss": 0.8131, "step": 4770 }, { "epoch": 9.6, "grad_norm": 40.247962951660156, "learning_rate": 9.381533400219319e-06, "loss": 0.7444, "step": 4800 }, { "epoch": 9.66, "grad_norm": 48.69584655761719, "learning_rate": 9.373944421667264e-06, "loss": 0.8159, "step": 4830 }, { "epoch": 9.72, "grad_norm": 30.084497451782227, "learning_rate": 9.366312274049602e-06, "loss": 0.7879, "step": 4860 }, { "epoch": 9.78, "grad_norm": 55.0740966796875, "learning_rate": 9.358637032692546e-06, "loss": 0.7506, "step": 4890 }, { "epoch": 9.84, "grad_norm": 116.40509796142578, "learning_rate": 9.35091877334763e-06, "loss": 0.6648, "step": 4920 }, { "epoch": 9.9, "grad_norm": 134.0435791015625, "learning_rate": 9.343157572190957e-06, "loss": 0.7205, "step": 4950 }, { "epoch": 9.96, "grad_norm": 60.22429656982422, "learning_rate": 9.33535350582245e-06, "loss": 0.8088, "step": 4980 }, { "epoch": 10.0, "eval_loss": 0.6922460794448853, "eval_map": 0.4107, "eval_map_50": 0.5706, "eval_map_75": 0.5008, "eval_map_chicken": 0.527, "eval_map_duck": 0.0, "eval_map_large": 0.7653, "eval_map_medium": 0.3953, "eval_map_plant": 0.705, "eval_map_small": 0.0425, "eval_mar_1": 0.1375, "eval_mar_10": 0.4929, "eval_mar_100": 0.4981, "eval_mar_100_chicken": 0.7218, "eval_mar_100_duck": 0.0, "eval_mar_100_plant": 0.7726, "eval_mar_large": 0.8272, "eval_mar_medium": 0.4833, "eval_mar_small": 0.1333, "eval_runtime": 5.2996, "eval_samples_per_second": 18.869, "eval_steps_per_second": 2.453, "step": 5000 }, { "epoch": 10.02, "grad_norm": 79.86975860595703, "learning_rate": 9.327506651265096e-06, "loss": 0.6511, "step": 5010 }, { "epoch": 10.08, "grad_norm": 101.35730743408203, "learning_rate": 9.319617085964177e-06, "loss": 0.6866, "step": 5040 }, { "epoch": 10.14, "grad_norm": 50.54615783691406, "learning_rate": 9.31168488778652e-06, "loss": 0.7279, "step": 5070 }, { "epoch": 10.2, "grad_norm": 0.004792827181518078, "learning_rate": 9.30371013501972e-06, "loss": 0.8451, "step": 5100 }, { "epoch": 10.26, "grad_norm": 65.52108764648438, "learning_rate": 9.295692906371362e-06, "loss": 0.7139, "step": 5130 }, { "epoch": 10.32, "grad_norm": 50.15769577026367, "learning_rate": 9.287633280968263e-06, "loss": 0.7791, "step": 5160 }, { "epoch": 10.38, "grad_norm": 41.1558952331543, "learning_rate": 9.279531338355666e-06, "loss": 0.7288, "step": 5190 }, { "epoch": 10.44, "grad_norm": 91.48247528076172, "learning_rate": 9.271387158496477e-06, "loss": 0.7832, "step": 5220 }, { "epoch": 10.5, "grad_norm": 53.355899810791016, "learning_rate": 9.263200821770462e-06, "loss": 0.8104, "step": 5250 }, { "epoch": 10.56, "grad_norm": 36.56712341308594, "learning_rate": 9.25497240897346e-06, "loss": 0.7152, "step": 5280 }, { "epoch": 10.62, "grad_norm": 0.004473070148378611, "learning_rate": 9.246702001316584e-06, "loss": 0.7701, "step": 5310 }, { "epoch": 10.68, "grad_norm": 93.80265808105469, "learning_rate": 9.238389680425417e-06, "loss": 0.6912, "step": 5340 }, { "epoch": 10.74, "grad_norm": 80.67282104492188, "learning_rate": 9.230035528339212e-06, "loss": 0.7225, "step": 5370 }, { "epoch": 10.8, "grad_norm": 66.9299545288086, "learning_rate": 9.221639627510076e-06, "loss": 0.6667, "step": 5400 }, { "epoch": 10.86, "grad_norm": 63.10317611694336, "learning_rate": 9.213202060802162e-06, "loss": 0.7136, "step": 5430 }, { "epoch": 10.92, "grad_norm": 53.23859786987305, "learning_rate": 9.204722911490847e-06, "loss": 0.7137, "step": 5460 }, { "epoch": 10.98, "grad_norm": 72.44120025634766, "learning_rate": 9.196202263261908e-06, "loss": 0.7049, "step": 5490 }, { "epoch": 11.0, "eval_loss": 0.6989492177963257, "eval_map": 0.4204, "eval_map_50": 0.5653, "eval_map_75": 0.5121, "eval_map_chicken": 0.5406, "eval_map_duck": 0.0, "eval_map_large": 0.7752, "eval_map_medium": 0.4022, "eval_map_plant": 0.7205, "eval_map_small": 0.0859, "eval_mar_1": 0.1439, "eval_mar_10": 0.4952, "eval_mar_100": 0.499, "eval_mar_100_chicken": 0.7182, "eval_mar_100_duck": 0.0, "eval_mar_100_plant": 0.7787, "eval_mar_large": 0.8293, "eval_mar_medium": 0.4863, "eval_mar_small": 0.1458, "eval_runtime": 5.0962, "eval_samples_per_second": 19.622, "eval_steps_per_second": 2.551, "step": 5500 }, { "epoch": 11.04, "grad_norm": 92.46695709228516, "learning_rate": 9.18764020021071e-06, "loss": 0.6504, "step": 5520 }, { "epoch": 11.1, "grad_norm": 28.806991577148438, "learning_rate": 9.179036806841352e-06, "loss": 0.6896, "step": 5550 }, { "epoch": 11.16, "grad_norm": 48.64046859741211, "learning_rate": 9.170392168065858e-06, "loss": 0.7909, "step": 5580 }, { "epoch": 11.22, "grad_norm": 84.09498596191406, "learning_rate": 9.161706369203319e-06, "loss": 0.714, "step": 5610 }, { "epoch": 11.28, "grad_norm": 73.94583129882812, "learning_rate": 9.152979495979064e-06, "loss": 0.5829, "step": 5640 }, { "epoch": 11.34, "grad_norm": 71.72589874267578, "learning_rate": 9.14421163452381e-06, "loss": 0.59, "step": 5670 }, { "epoch": 11.4, "grad_norm": 415.1078796386719, "learning_rate": 9.13540287137281e-06, "loss": 0.7187, "step": 5700 }, { "epoch": 11.46, "grad_norm": 48.62983322143555, "learning_rate": 9.126553293465e-06, "loss": 0.8666, "step": 5730 }, { "epoch": 11.52, "grad_norm": 36.73117446899414, "learning_rate": 9.117662988142138e-06, "loss": 0.916, "step": 5760 }, { "epoch": 11.58, "grad_norm": 115.80775451660156, "learning_rate": 9.108732043147952e-06, "loss": 0.7241, "step": 5790 }, { "epoch": 11.64, "grad_norm": 77.43502807617188, "learning_rate": 9.099760546627262e-06, "loss": 0.6617, "step": 5820 }, { "epoch": 11.7, "grad_norm": 31.340518951416016, "learning_rate": 9.090748587125118e-06, "loss": 0.7765, "step": 5850 }, { "epoch": 11.76, "grad_norm": 34.73516845703125, "learning_rate": 9.08169625358592e-06, "loss": 0.6421, "step": 5880 }, { "epoch": 11.82, "grad_norm": 50.42566680908203, "learning_rate": 9.072603635352548e-06, "loss": 0.8824, "step": 5910 }, { "epoch": 11.88, "grad_norm": 61.33326721191406, "learning_rate": 9.06347082216547e-06, "loss": 0.8302, "step": 5940 }, { "epoch": 11.94, "grad_norm": 94.31954193115234, "learning_rate": 9.054297904161868e-06, "loss": 0.7238, "step": 5970 }, { "epoch": 12.0, "grad_norm": 241.52101135253906, "learning_rate": 9.045084971874738e-06, "loss": 0.7244, "step": 6000 }, { "epoch": 12.0, "eval_loss": 0.6310720443725586, "eval_map": 0.4276, "eval_map_50": 0.584, "eval_map_75": 0.5016, "eval_map_chicken": 0.5447, "eval_map_duck": 0.0, "eval_map_large": 0.7945, "eval_map_medium": 0.4104, "eval_map_plant": 0.7382, "eval_map_small": 0.0749, "eval_mar_1": 0.1445, "eval_mar_10": 0.4989, "eval_mar_100": 0.5035, "eval_mar_100_chicken": 0.7133, "eval_mar_100_duck": 0.0, "eval_mar_100_plant": 0.7971, "eval_mar_large": 0.8515, "eval_mar_medium": 0.4876, "eval_mar_small": 0.1542, "eval_runtime": 5.0099, "eval_samples_per_second": 19.961, "eval_steps_per_second": 2.595, "step": 6000 }, { "epoch": 12.06, "grad_norm": 116.31084442138672, "learning_rate": 9.035832116232002e-06, "loss": 0.5482, "step": 6030 }, { "epoch": 12.12, "grad_norm": 65.95005798339844, "learning_rate": 9.026539428555609e-06, "loss": 0.6084, "step": 6060 }, { "epoch": 12.18, "grad_norm": 59.240360260009766, "learning_rate": 9.017207000560639e-06, "loss": 0.6436, "step": 6090 }, { "epoch": 12.24, "grad_norm": 117.28052520751953, "learning_rate": 9.007834924354384e-06, "loss": 0.7394, "step": 6120 }, { "epoch": 12.3, "grad_norm": 54.573299407958984, "learning_rate": 8.998423292435455e-06, "loss": 0.746, "step": 6150 }, { "epoch": 12.36, "grad_norm": 59.95296096801758, "learning_rate": 8.988972197692857e-06, "loss": 0.7718, "step": 6180 }, { "epoch": 12.42, "grad_norm": 27.571857452392578, "learning_rate": 8.97948173340508e-06, "loss": 0.7943, "step": 6210 }, { "epoch": 12.48, "grad_norm": 180.5658416748047, "learning_rate": 8.969951993239177e-06, "loss": 0.7434, "step": 6240 }, { "epoch": 12.54, "grad_norm": 89.40031433105469, "learning_rate": 8.960383071249837e-06, "loss": 0.6528, "step": 6270 }, { "epoch": 12.6, "grad_norm": 84.45803833007812, "learning_rate": 8.950775061878453e-06, "loss": 0.6857, "step": 6300 }, { "epoch": 12.66, "grad_norm": 73.63268280029297, "learning_rate": 8.9411280599522e-06, "loss": 0.7559, "step": 6330 }, { "epoch": 12.72, "grad_norm": 0.0037382396403700113, "learning_rate": 8.931442160683094e-06, "loss": 0.6612, "step": 6360 }, { "epoch": 12.78, "grad_norm": 120.78377532958984, "learning_rate": 8.921717459667052e-06, "loss": 0.7691, "step": 6390 }, { "epoch": 12.84, "grad_norm": 30.826618194580078, "learning_rate": 8.911954052882941e-06, "loss": 0.7987, "step": 6420 }, { "epoch": 12.9, "grad_norm": 40.72140884399414, "learning_rate": 8.902152036691649e-06, "loss": 0.8032, "step": 6450 }, { "epoch": 12.96, "grad_norm": 34.382293701171875, "learning_rate": 8.892311507835118e-06, "loss": 0.683, "step": 6480 }, { "epoch": 13.0, "eval_loss": 0.6243864893913269, "eval_map": 0.4371, "eval_map_50": 0.5962, "eval_map_75": 0.5288, "eval_map_chicken": 0.5784, "eval_map_duck": 0.0, "eval_map_large": 0.7935, "eval_map_medium": 0.4149, "eval_map_plant": 0.7329, "eval_map_small": 0.0877, "eval_mar_1": 0.1447, "eval_mar_10": 0.5002, "eval_mar_100": 0.5031, "eval_mar_100_chicken": 0.7244, "eval_mar_100_duck": 0.0, "eval_mar_100_plant": 0.7847, "eval_mar_large": 0.8427, "eval_mar_medium": 0.486, "eval_mar_small": 0.1312, "eval_runtime": 4.9066, "eval_samples_per_second": 20.381, "eval_steps_per_second": 2.649, "step": 6500 }, { "epoch": 13.02, "grad_norm": 49.30002975463867, "learning_rate": 8.882432563435394e-06, "loss": 0.7653, "step": 6510 }, { "epoch": 13.08, "grad_norm": 0.010997344739735126, "learning_rate": 8.872515300993669e-06, "loss": 0.6646, "step": 6540 }, { "epoch": 13.14, "grad_norm": 65.29388427734375, "learning_rate": 8.862559818389322e-06, "loss": 0.6705, "step": 6570 }, { "epoch": 13.2, "grad_norm": 56.85333251953125, "learning_rate": 8.852566213878947e-06, "loss": 0.7125, "step": 6600 }, { "epoch": 13.26, "grad_norm": 79.7491226196289, "learning_rate": 8.842534586095383e-06, "loss": 0.6535, "step": 6630 }, { "epoch": 13.32, "grad_norm": 59.6799430847168, "learning_rate": 8.83246503404675e-06, "loss": 0.6035, "step": 6660 }, { "epoch": 13.38, "grad_norm": 96.64356231689453, "learning_rate": 8.82235765711546e-06, "loss": 0.6654, "step": 6690 }, { "epoch": 13.44, "grad_norm": 91.82725524902344, "learning_rate": 8.81221255505724e-06, "loss": 0.6695, "step": 6720 }, { "epoch": 13.5, "grad_norm": 36.14399719238281, "learning_rate": 8.802029828000157e-06, "loss": 0.8221, "step": 6750 }, { "epoch": 13.56, "grad_norm": 46.07867431640625, "learning_rate": 8.791809576443611e-06, "loss": 0.7196, "step": 6780 }, { "epoch": 13.62, "grad_norm": 22.723224639892578, "learning_rate": 8.78155190125736e-06, "loss": 0.717, "step": 6810 }, { "epoch": 13.68, "grad_norm": 186.8100128173828, "learning_rate": 8.77125690368052e-06, "loss": 0.805, "step": 6840 }, { "epoch": 13.74, "grad_norm": 52.61324691772461, "learning_rate": 8.760924685320558e-06, "loss": 0.645, "step": 6870 }, { "epoch": 13.8, "grad_norm": 0.00226211897097528, "learning_rate": 8.750555348152299e-06, "loss": 0.6038, "step": 6900 }, { "epoch": 13.86, "grad_norm": 46.638126373291016, "learning_rate": 8.740148994516912e-06, "loss": 0.6805, "step": 6930 }, { "epoch": 13.92, "grad_norm": 32.8173942565918, "learning_rate": 8.729705727120911e-06, "loss": 0.6252, "step": 6960 }, { "epoch": 13.98, "grad_norm": 45.916847229003906, "learning_rate": 8.719225649035126e-06, "loss": 0.6541, "step": 6990 }, { "epoch": 14.0, "eval_loss": 0.554333508014679, "eval_map": 0.4719, "eval_map_50": 0.6191, "eval_map_75": 0.5555, "eval_map_chicken": 0.6567, "eval_map_duck": 0.0, "eval_map_large": 0.8231, "eval_map_medium": 0.4525, "eval_map_plant": 0.759, "eval_map_small": 0.0712, "eval_mar_1": 0.1494, "eval_mar_10": 0.5195, "eval_mar_100": 0.5249, "eval_mar_100_chicken": 0.7644, "eval_mar_100_duck": 0.0, "eval_mar_100_plant": 0.8104, "eval_mar_large": 0.8715, "eval_mar_medium": 0.5025, "eval_mar_small": 0.1896, "eval_runtime": 5.164, "eval_samples_per_second": 19.365, "eval_steps_per_second": 2.517, "step": 7000 }, { "epoch": 14.04, "grad_norm": 48.85868835449219, "learning_rate": 8.708708863693696e-06, "loss": 0.5773, "step": 7020 }, { "epoch": 14.1, "grad_norm": 443.4310607910156, "learning_rate": 8.69815547489305e-06, "loss": 0.6889, "step": 7050 }, { "epoch": 14.16, "grad_norm": 0.0019413733389228582, "learning_rate": 8.68756558679087e-06, "loss": 0.6352, "step": 7080 }, { "epoch": 14.22, "grad_norm": 66.77024841308594, "learning_rate": 8.67693930390508e-06, "loss": 0.9123, "step": 7110 }, { "epoch": 14.28, "grad_norm": 229.13998413085938, "learning_rate": 8.666276731112802e-06, "loss": 0.721, "step": 7140 }, { "epoch": 14.34, "grad_norm": 56.66972351074219, "learning_rate": 8.655577973649322e-06, "loss": 0.6267, "step": 7170 }, { "epoch": 14.4, "grad_norm": 54.61463928222656, "learning_rate": 8.644843137107058e-06, "loss": 0.725, "step": 7200 }, { "epoch": 14.46, "grad_norm": 40.25044250488281, "learning_rate": 8.634072327434515e-06, "loss": 0.5895, "step": 7230 }, { "epoch": 14.52, "grad_norm": 59.81513595581055, "learning_rate": 8.623265650935233e-06, "loss": 0.6714, "step": 7260 }, { "epoch": 14.58, "grad_norm": 49.08866882324219, "learning_rate": 8.612423214266749e-06, "loss": 0.6454, "step": 7290 }, { "epoch": 14.64, "grad_norm": 47.70410919189453, "learning_rate": 8.601545124439535e-06, "loss": 0.6701, "step": 7320 }, { "epoch": 14.7, "grad_norm": 50.41656494140625, "learning_rate": 8.590631488815945e-06, "loss": 0.6167, "step": 7350 }, { "epoch": 14.76, "grad_norm": 37.03781509399414, "learning_rate": 8.579682415109156e-06, "loss": 0.6049, "step": 7380 }, { "epoch": 14.82, "grad_norm": 59.566505432128906, "learning_rate": 8.568698011382108e-06, "loss": 0.8524, "step": 7410 }, { "epoch": 14.88, "grad_norm": 49.214229583740234, "learning_rate": 8.557678386046429e-06, "loss": 0.6073, "step": 7440 }, { "epoch": 14.94, "grad_norm": 54.74986267089844, "learning_rate": 8.54662364786137e-06, "loss": 0.7139, "step": 7470 }, { "epoch": 15.0, "grad_norm": 0.0027110481169074774, "learning_rate": 8.535533905932739e-06, "loss": 0.6219, "step": 7500 }, { "epoch": 15.0, "eval_loss": 0.5367693305015564, "eval_map": 0.4754, "eval_map_50": 0.6197, "eval_map_75": 0.5553, "eval_map_chicken": 0.6691, "eval_map_duck": 0.0, "eval_map_large": 0.825, "eval_map_medium": 0.4584, "eval_map_plant": 0.7571, "eval_map_small": 0.0764, "eval_mar_1": 0.1528, "eval_mar_10": 0.5216, "eval_mar_100": 0.5265, "eval_mar_100_chicken": 0.7724, "eval_mar_100_duck": 0.0, "eval_mar_100_plant": 0.8072, "eval_mar_large": 0.8711, "eval_mar_medium": 0.5038, "eval_mar_small": 0.1688, "eval_runtime": 5.029, "eval_samples_per_second": 19.885, "eval_steps_per_second": 2.585, "step": 7500 }, { "epoch": 15.06, "grad_norm": 101.3479995727539, "learning_rate": 8.524409269711808e-06, "loss": 0.6541, "step": 7530 }, { "epoch": 15.12, "grad_norm": 32.30617141723633, "learning_rate": 8.513249848994248e-06, "loss": 0.7145, "step": 7560 }, { "epoch": 15.18, "grad_norm": 118.48365783691406, "learning_rate": 8.502055753919033e-06, "loss": 0.6418, "step": 7590 }, { "epoch": 15.24, "grad_norm": 146.08511352539062, "learning_rate": 8.490827094967364e-06, "loss": 0.5815, "step": 7620 }, { "epoch": 15.3, "grad_norm": 74.51444244384766, "learning_rate": 8.479563982961572e-06, "loss": 0.6067, "step": 7650 }, { "epoch": 15.36, "grad_norm": 71.7569580078125, "learning_rate": 8.468266529064025e-06, "loss": 0.6352, "step": 7680 }, { "epoch": 15.42, "grad_norm": 63.288089752197266, "learning_rate": 8.456934844776033e-06, "loss": 0.7251, "step": 7710 }, { "epoch": 15.48, "grad_norm": 52.670902252197266, "learning_rate": 8.445569041936743e-06, "loss": 0.755, "step": 7740 }, { "epoch": 15.54, "grad_norm": 154.50787353515625, "learning_rate": 8.434169232722043e-06, "loss": 0.5829, "step": 7770 }, { "epoch": 15.6, "grad_norm": 72.39775085449219, "learning_rate": 8.422735529643445e-06, "loss": 0.6424, "step": 7800 }, { "epoch": 15.66, "grad_norm": 189.01527404785156, "learning_rate": 8.411268045546984e-06, "loss": 0.6285, "step": 7830 }, { "epoch": 15.72, "grad_norm": 113.38286590576172, "learning_rate": 8.399766893612096e-06, "loss": 0.6086, "step": 7860 }, { "epoch": 15.78, "grad_norm": 22.89063262939453, "learning_rate": 8.388232187350513e-06, "loss": 0.6352, "step": 7890 }, { "epoch": 15.84, "grad_norm": 29.94500160217285, "learning_rate": 8.376664040605122e-06, "loss": 0.7657, "step": 7920 }, { "epoch": 15.9, "grad_norm": 67.85516357421875, "learning_rate": 8.365062567548868e-06, "loss": 0.7562, "step": 7950 }, { "epoch": 15.96, "grad_norm": 173.4965057373047, "learning_rate": 8.353427882683601e-06, "loss": 0.5842, "step": 7980 }, { "epoch": 16.0, "eval_loss": 0.5324800610542297, "eval_map": 0.4778, "eval_map_50": 0.6269, "eval_map_75": 0.5668, "eval_map_chicken": 0.6922, "eval_map_duck": 0.0, "eval_map_large": 0.8015, "eval_map_medium": 0.4558, "eval_map_plant": 0.7412, "eval_map_small": 0.1147, "eval_mar_1": 0.1501, "eval_mar_10": 0.5178, "eval_mar_100": 0.5218, "eval_mar_100_chicken": 0.7636, "eval_mar_100_duck": 0.0, "eval_mar_100_plant": 0.8017, "eval_mar_large": 0.8556, "eval_mar_medium": 0.5071, "eval_mar_small": 0.1604, "eval_runtime": 5.0074, "eval_samples_per_second": 19.971, "eval_steps_per_second": 2.596, "step": 8000 }, { "epoch": 16.02, "grad_norm": 63.686378479003906, "learning_rate": 8.341760100838967e-06, "loss": 0.7119, "step": 8010 }, { "epoch": 16.08, "grad_norm": 34.64134216308594, "learning_rate": 8.33005933717126e-06, "loss": 0.6144, "step": 8040 }, { "epoch": 16.14, "grad_norm": 34.982269287109375, "learning_rate": 8.318325707162293e-06, "loss": 0.6278, "step": 8070 }, { "epoch": 16.2, "grad_norm": 53.49913024902344, "learning_rate": 8.30655932661826e-06, "loss": 0.6089, "step": 8100 }, { "epoch": 16.26, "grad_norm": 118.85201263427734, "learning_rate": 8.294760311668586e-06, "loss": 0.6401, "step": 8130 }, { "epoch": 16.32, "grad_norm": 35.8175048828125, "learning_rate": 8.282928778764783e-06, "loss": 0.5656, "step": 8160 }, { "epoch": 16.38, "grad_norm": 19.808303833007812, "learning_rate": 8.271064844679306e-06, "loss": 0.5821, "step": 8190 }, { "epoch": 16.44, "grad_norm": 62.134803771972656, "learning_rate": 8.259168626504395e-06, "loss": 0.6077, "step": 8220 }, { "epoch": 16.5, "grad_norm": 31.38833999633789, "learning_rate": 8.247240241650918e-06, "loss": 0.5492, "step": 8250 }, { "epoch": 16.56, "grad_norm": 77.07894897460938, "learning_rate": 8.235279807847223e-06, "loss": 0.641, "step": 8280 }, { "epoch": 16.62, "grad_norm": 65.0913314819336, "learning_rate": 8.223287443137957e-06, "loss": 0.5655, "step": 8310 }, { "epoch": 16.68, "grad_norm": 217.502685546875, "learning_rate": 8.211263265882923e-06, "loss": 0.6829, "step": 8340 }, { "epoch": 16.74, "grad_norm": 145.74627685546875, "learning_rate": 8.199207394755892e-06, "loss": 0.664, "step": 8370 }, { "epoch": 16.8, "grad_norm": 61.71194076538086, "learning_rate": 8.18711994874345e-06, "loss": 0.5375, "step": 8400 }, { "epoch": 16.86, "grad_norm": 74.38108825683594, "learning_rate": 8.175001047143804e-06, "loss": 0.6282, "step": 8430 }, { "epoch": 16.92, "grad_norm": 88.76374816894531, "learning_rate": 8.162850809565623e-06, "loss": 0.6561, "step": 8460 }, { "epoch": 16.98, "grad_norm": 82.03018188476562, "learning_rate": 8.150669355926848e-06, "loss": 0.5704, "step": 8490 }, { "epoch": 17.0, "eval_loss": 0.5436572432518005, "eval_map": 0.5192, "eval_map_50": 0.6982, "eval_map_75": 0.6149, "eval_map_chicken": 0.6772, "eval_map_duck": 0.1347, "eval_map_large": 0.8084, "eval_map_medium": 0.5014, "eval_map_plant": 0.7456, "eval_map_small": 0.0616, "eval_mar_1": 0.1798, "eval_mar_10": 0.558, "eval_mar_100": 0.5618, "eval_mar_100_chicken": 0.7449, "eval_mar_100_duck": 0.1412, "eval_mar_100_plant": 0.7994, "eval_mar_large": 0.8644, "eval_mar_medium": 0.5445, "eval_mar_small": 0.1521, "eval_runtime": 5.0124, "eval_samples_per_second": 19.95, "eval_steps_per_second": 2.594, "step": 8500 }, { "epoch": 17.04, "grad_norm": 106.79338073730469, "learning_rate": 8.138456806453503e-06, "loss": 0.7365, "step": 8520 }, { "epoch": 17.1, "grad_norm": 79.06564331054688, "learning_rate": 8.126213281678527e-06, "loss": 0.6555, "step": 8550 }, { "epoch": 17.16, "grad_norm": 31.134279251098633, "learning_rate": 8.113938902440563e-06, "loss": 0.5704, "step": 8580 }, { "epoch": 17.22, "grad_norm": 52.495059967041016, "learning_rate": 8.101633789882781e-06, "loss": 0.6709, "step": 8610 }, { "epoch": 17.28, "grad_norm": 45.442081451416016, "learning_rate": 8.089298065451673e-06, "loss": 0.5955, "step": 8640 }, { "epoch": 17.34, "grad_norm": 71.86921691894531, "learning_rate": 8.076931850895858e-06, "loss": 0.6332, "step": 8670 }, { "epoch": 17.4, "grad_norm": 61.51048278808594, "learning_rate": 8.064535268264883e-06, "loss": 0.6525, "step": 8700 }, { "epoch": 17.46, "grad_norm": 71.84506225585938, "learning_rate": 8.052108439908014e-06, "loss": 0.5134, "step": 8730 }, { "epoch": 17.52, "grad_norm": 58.42548370361328, "learning_rate": 8.039651488473028e-06, "loss": 0.6082, "step": 8760 }, { "epoch": 17.58, "grad_norm": 58.07726287841797, "learning_rate": 8.027164536905008e-06, "loss": 0.581, "step": 8790 }, { "epoch": 17.64, "grad_norm": 167.6965789794922, "learning_rate": 8.014647708445124e-06, "loss": 0.5426, "step": 8820 }, { "epoch": 17.7, "grad_norm": 37.38274383544922, "learning_rate": 8.002101126629422e-06, "loss": 0.5913, "step": 8850 }, { "epoch": 17.76, "grad_norm": 63.516876220703125, "learning_rate": 7.989524915287595e-06, "loss": 0.6801, "step": 8880 }, { "epoch": 17.82, "grad_norm": 48.16976547241211, "learning_rate": 7.976919198541775e-06, "loss": 0.5655, "step": 8910 }, { "epoch": 17.88, "grad_norm": 85.60452270507812, "learning_rate": 7.964284100805297e-06, "loss": 0.6774, "step": 8940 }, { "epoch": 17.94, "grad_norm": 56.792022705078125, "learning_rate": 7.951619746781474e-06, "loss": 0.6201, "step": 8970 }, { "epoch": 18.0, "grad_norm": 60.09886932373047, "learning_rate": 7.938926261462366e-06, "loss": 0.5683, "step": 9000 }, { "epoch": 18.0, "eval_loss": 0.5067680478096008, "eval_map": 0.6324, "eval_map_50": 0.8451, "eval_map_75": 0.7659, "eval_map_chicken": 0.6996, "eval_map_duck": 0.4404, "eval_map_large": 0.8208, "eval_map_medium": 0.6253, "eval_map_plant": 0.7573, "eval_map_small": 0.0963, "eval_mar_1": 0.225, "eval_mar_10": 0.6739, "eval_mar_100": 0.6793, "eval_mar_100_chicken": 0.7573, "eval_mar_100_duck": 0.4753, "eval_mar_100_plant": 0.8052, "eval_mar_large": 0.8628, "eval_mar_medium": 0.6808, "eval_mar_small": 0.175, "eval_runtime": 5.0071, "eval_samples_per_second": 19.971, "eval_steps_per_second": 2.596, "step": 9000 }, { "epoch": 18.06, "grad_norm": 66.6285400390625, "learning_rate": 7.926203770127552e-06, "loss": 0.5579, "step": 9030 }, { "epoch": 18.12, "grad_norm": 127.3472671508789, "learning_rate": 7.913452398342882e-06, "loss": 0.5633, "step": 9060 }, { "epoch": 18.18, "grad_norm": 70.93628692626953, "learning_rate": 7.900672271959247e-06, "loss": 0.6412, "step": 9090 }, { "epoch": 18.24, "grad_norm": 81.13060760498047, "learning_rate": 7.887863517111337e-06, "loss": 0.6309, "step": 9120 }, { "epoch": 18.3, "grad_norm": 66.56903839111328, "learning_rate": 7.875026260216395e-06, "loss": 0.5713, "step": 9150 }, { "epoch": 18.36, "grad_norm": 49.273643493652344, "learning_rate": 7.862160627972956e-06, "loss": 0.5789, "step": 9180 }, { "epoch": 18.42, "grad_norm": 36.204036712646484, "learning_rate": 7.849266747359619e-06, "loss": 0.6162, "step": 9210 }, { "epoch": 18.48, "grad_norm": 55.067718505859375, "learning_rate": 7.836344745633785e-06, "loss": 0.6287, "step": 9240 }, { "epoch": 18.54, "grad_norm": 96.10171508789062, "learning_rate": 7.823394750330386e-06, "loss": 0.6219, "step": 9270 }, { "epoch": 18.6, "grad_norm": 47.33934783935547, "learning_rate": 7.810416889260653e-06, "loss": 0.7037, "step": 9300 }, { "epoch": 18.66, "grad_norm": 97.90437316894531, "learning_rate": 7.797411290510836e-06, "loss": 0.5965, "step": 9330 }, { "epoch": 18.72, "grad_norm": 36.546260833740234, "learning_rate": 7.78437808244094e-06, "loss": 0.5984, "step": 9360 }, { "epoch": 18.78, "grad_norm": 46.64151382446289, "learning_rate": 7.771317393683471e-06, "loss": 0.532, "step": 9390 }, { "epoch": 18.84, "grad_norm": 102.95185852050781, "learning_rate": 7.758229353142153e-06, "loss": 0.6825, "step": 9420 }, { "epoch": 18.9, "grad_norm": 53.53539276123047, "learning_rate": 7.74511408999066e-06, "loss": 0.6691, "step": 9450 }, { "epoch": 18.96, "grad_norm": 83.08556365966797, "learning_rate": 7.731971733671347e-06, "loss": 0.6402, "step": 9480 }, { "epoch": 19.0, "eval_loss": 0.46823224425315857, "eval_map": 0.6741, "eval_map_50": 0.8823, "eval_map_75": 0.8298, "eval_map_chicken": 0.7195, "eval_map_duck": 0.5335, "eval_map_large": 0.8274, "eval_map_medium": 0.6748, "eval_map_plant": 0.7691, "eval_map_small": 0.1357, "eval_mar_1": 0.2516, "eval_mar_10": 0.7135, "eval_mar_100": 0.7185, "eval_mar_100_chicken": 0.7698, "eval_mar_100_duck": 0.567, "eval_mar_100_plant": 0.8187, "eval_mar_large": 0.8728, "eval_mar_medium": 0.7246, "eval_mar_small": 0.2104, "eval_runtime": 5.1062, "eval_samples_per_second": 19.584, "eval_steps_per_second": 2.546, "step": 9500 }, { "epoch": 19.02, "grad_norm": 54.46965408325195, "learning_rate": 7.718802413893963e-06, "loss": 0.6762, "step": 9510 }, { "epoch": 19.08, "grad_norm": 101.3377685546875, "learning_rate": 7.70560626063438e-06, "loss": 0.5893, "step": 9540 }, { "epoch": 19.14, "grad_norm": 54.880916595458984, "learning_rate": 7.692383404133302e-06, "loss": 0.5074, "step": 9570 }, { "epoch": 19.2, "grad_norm": 60.68124771118164, "learning_rate": 7.679133974894984e-06, "loss": 0.5336, "step": 9600 }, { "epoch": 19.26, "grad_norm": 26.069740295410156, "learning_rate": 7.665858103685944e-06, "loss": 0.5209, "step": 9630 }, { "epoch": 19.32, "grad_norm": 79.79200744628906, "learning_rate": 7.652555921533671e-06, "loss": 0.5702, "step": 9660 }, { "epoch": 19.38, "grad_norm": 208.93028259277344, "learning_rate": 7.639227559725333e-06, "loss": 0.6033, "step": 9690 }, { "epoch": 19.44, "grad_norm": 32.772396087646484, "learning_rate": 7.6258731498064796e-06, "loss": 0.5473, "step": 9720 }, { "epoch": 19.5, "grad_norm": 62.062557220458984, "learning_rate": 7.612492823579744e-06, "loss": 0.6168, "step": 9750 }, { "epoch": 19.56, "grad_norm": 46.67622375488281, "learning_rate": 7.5990867131035474e-06, "loss": 0.5714, "step": 9780 }, { "epoch": 19.62, "grad_norm": 58.50261306762695, "learning_rate": 7.585654950690786e-06, "loss": 0.5411, "step": 9810 }, { "epoch": 19.68, "grad_norm": 0.0009975264547392726, "learning_rate": 7.572197668907533e-06, "loss": 0.5943, "step": 9840 }, { "epoch": 19.74, "grad_norm": 37.597755432128906, "learning_rate": 7.5587150005717256e-06, "loss": 0.6523, "step": 9870 }, { "epoch": 19.8, "grad_norm": 46.372833251953125, "learning_rate": 7.545207078751858e-06, "loss": 0.5803, "step": 9900 }, { "epoch": 19.86, "grad_norm": 53.04841995239258, "learning_rate": 7.531674036765662e-06, "loss": 0.6232, "step": 9930 }, { "epoch": 19.92, "grad_norm": 49.54397964477539, "learning_rate": 7.518116008178805e-06, "loss": 0.5833, "step": 9960 }, { "epoch": 19.98, "grad_norm": 93.43566131591797, "learning_rate": 7.5045331268035505e-06, "loss": 0.5664, "step": 9990 }, { "epoch": 20.0, "eval_loss": 0.4792620539665222, "eval_map": 0.6841, "eval_map_50": 0.9057, "eval_map_75": 0.8277, "eval_map_chicken": 0.7325, "eval_map_duck": 0.5558, "eval_map_large": 0.8164, "eval_map_medium": 0.6878, "eval_map_plant": 0.7638, "eval_map_small": 0.135, "eval_mar_1": 0.2585, "eval_mar_10": 0.7299, "eval_mar_100": 0.7341, "eval_mar_100_chicken": 0.7853, "eval_mar_100_duck": 0.5979, "eval_mar_100_plant": 0.819, "eval_mar_large": 0.8649, "eval_mar_medium": 0.7463, "eval_mar_small": 0.2396, "eval_runtime": 5.1021, "eval_samples_per_second": 19.6, "eval_steps_per_second": 2.548, "step": 10000 }, { "epoch": 20.04, "grad_norm": 97.10029602050781, "learning_rate": 7.490925526697455e-06, "loss": 0.5375, "step": 10020 }, { "epoch": 20.1, "grad_norm": 34.54094696044922, "learning_rate": 7.477293342162038e-06, "loss": 0.5242, "step": 10050 }, { "epoch": 20.16, "grad_norm": 74.18828582763672, "learning_rate": 7.463636707741458e-06, "loss": 0.4776, "step": 10080 }, { "epoch": 20.22, "grad_norm": 61.5256233215332, "learning_rate": 7.449955758221184e-06, "loss": 0.5529, "step": 10110 }, { "epoch": 20.28, "grad_norm": 390.4728088378906, "learning_rate": 7.436250628626662e-06, "loss": 0.6218, "step": 10140 }, { "epoch": 20.34, "grad_norm": 68.62318420410156, "learning_rate": 7.42252145422199e-06, "loss": 0.5621, "step": 10170 }, { "epoch": 20.4, "grad_norm": 44.162994384765625, "learning_rate": 7.408768370508577e-06, "loss": 0.5153, "step": 10200 }, { "epoch": 20.46, "grad_norm": 65.52782440185547, "learning_rate": 7.394991513223806e-06, "loss": 0.5388, "step": 10230 }, { "epoch": 20.52, "grad_norm": 31.844987869262695, "learning_rate": 7.381191018339697e-06, "loss": 0.4896, "step": 10260 }, { "epoch": 20.58, "grad_norm": 53.01321792602539, "learning_rate": 7.3673670220615615e-06, "loss": 0.5244, "step": 10290 }, { "epoch": 20.64, "grad_norm": 47.084693908691406, "learning_rate": 7.353519660826665e-06, "loss": 0.9178, "step": 10320 }, { "epoch": 20.7, "grad_norm": 91.9738540649414, "learning_rate": 7.3396490713028674e-06, "loss": 0.5282, "step": 10350 }, { "epoch": 20.76, "grad_norm": 79.40870666503906, "learning_rate": 7.325755390387293e-06, "loss": 0.5952, "step": 10380 }, { "epoch": 20.82, "grad_norm": 91.8105239868164, "learning_rate": 7.31183875520496e-06, "loss": 0.6473, "step": 10410 }, { "epoch": 20.88, "grad_norm": 51.59716796875, "learning_rate": 7.297899303107441e-06, "loss": 0.5078, "step": 10440 }, { "epoch": 20.94, "grad_norm": 66.34852600097656, "learning_rate": 7.283937171671498e-06, "loss": 0.4993, "step": 10470 }, { "epoch": 21.0, "grad_norm": 51.79935836791992, "learning_rate": 7.269952498697734e-06, "loss": 0.4411, "step": 10500 }, { "epoch": 21.0, "eval_loss": 0.44476136565208435, "eval_map": 0.7042, "eval_map_50": 0.932, "eval_map_75": 0.8592, "eval_map_chicken": 0.7128, "eval_map_duck": 0.6338, "eval_map_large": 0.8287, "eval_map_medium": 0.7039, "eval_map_plant": 0.766, "eval_map_small": 0.1098, "eval_mar_1": 0.2789, "eval_mar_10": 0.7527, "eval_mar_100": 0.7568, "eval_mar_100_chicken": 0.7658, "eval_mar_100_duck": 0.6845, "eval_mar_100_plant": 0.8202, "eval_mar_large": 0.8749, "eval_mar_medium": 0.7703, "eval_mar_small": 0.1718, "eval_runtime": 5.4795, "eval_samples_per_second": 18.25, "eval_steps_per_second": 2.372, "step": 10500 }, { "epoch": 21.06, "grad_norm": 52.99646759033203, "learning_rate": 7.2559454222092265e-06, "loss": 0.5123, "step": 10530 }, { "epoch": 21.12, "grad_norm": 35.29424285888672, "learning_rate": 7.241916080450163e-06, "loss": 0.5506, "step": 10560 }, { "epoch": 21.18, "grad_norm": 43.816009521484375, "learning_rate": 7.227864611884483e-06, "loss": 0.5644, "step": 10590 }, { "epoch": 21.24, "grad_norm": 106.69770812988281, "learning_rate": 7.21379115519451e-06, "loss": 0.5914, "step": 10620 }, { "epoch": 21.3, "grad_norm": 714.3410034179688, "learning_rate": 7.199695849279576e-06, "loss": 0.4671, "step": 10650 }, { "epoch": 21.36, "grad_norm": 40.27183532714844, "learning_rate": 7.185578833254665e-06, "loss": 0.5317, "step": 10680 }, { "epoch": 21.42, "grad_norm": 63.30058670043945, "learning_rate": 7.171440246449024e-06, "loss": 0.5063, "step": 10710 }, { "epoch": 21.48, "grad_norm": 31.39018440246582, "learning_rate": 7.157280228404796e-06, "loss": 0.5745, "step": 10740 }, { "epoch": 21.54, "grad_norm": 41.66950225830078, "learning_rate": 7.143098918875643e-06, "loss": 0.5368, "step": 10770 }, { "epoch": 21.6, "grad_norm": 75.50695037841797, "learning_rate": 7.128896457825364e-06, "loss": 0.6055, "step": 10800 }, { "epoch": 21.66, "grad_norm": 43.1558837890625, "learning_rate": 7.114672985426516e-06, "loss": 0.5593, "step": 10830 }, { "epoch": 21.72, "grad_norm": 39.317481994628906, "learning_rate": 7.100428642059033e-06, "loss": 0.5486, "step": 10860 }, { "epoch": 21.78, "grad_norm": 47.37519073486328, "learning_rate": 7.086163568308828e-06, "loss": 0.5348, "step": 10890 }, { "epoch": 21.84, "grad_norm": 109.30632781982422, "learning_rate": 7.071877904966422e-06, "loss": 0.5404, "step": 10920 }, { "epoch": 21.9, "grad_norm": 57.96327209472656, "learning_rate": 7.057571793025545e-06, "loss": 0.5283, "step": 10950 }, { "epoch": 21.96, "grad_norm": 97.8825454711914, "learning_rate": 7.043245373681746e-06, "loss": 0.6106, "step": 10980 }, { "epoch": 22.0, "eval_loss": 0.41423293948173523, "eval_map": 0.7307, "eval_map_50": 0.9307, "eval_map_75": 0.8797, "eval_map_chicken": 0.7379, "eval_map_duck": 0.6726, "eval_map_large": 0.8381, "eval_map_medium": 0.735, "eval_map_plant": 0.7817, "eval_map_small": 0.0773, "eval_mar_1": 0.2841, "eval_mar_10": 0.7736, "eval_mar_100": 0.7783, "eval_mar_100_chicken": 0.7853, "eval_mar_100_duck": 0.7134, "eval_mar_100_plant": 0.836, "eval_mar_large": 0.8866, "eval_mar_medium": 0.7946, "eval_mar_small": 0.2062, "eval_runtime": 5.0811, "eval_samples_per_second": 19.681, "eval_steps_per_second": 2.559, "step": 11000 }, { "epoch": 22.02, "grad_norm": 94.26522827148438, "learning_rate": 7.028898788331e-06, "loss": 0.5071, "step": 11010 }, { "epoch": 22.08, "grad_norm": 105.05602264404297, "learning_rate": 7.014532178568314e-06, "loss": 0.465, "step": 11040 }, { "epoch": 22.14, "grad_norm": 51.92534255981445, "learning_rate": 7.0001456861863236e-06, "loss": 0.5546, "step": 11070 }, { "epoch": 22.2, "grad_norm": 29.79014778137207, "learning_rate": 6.985739453173903e-06, "loss": 0.4825, "step": 11100 }, { "epoch": 22.26, "grad_norm": 80.56990814208984, "learning_rate": 6.971313621714756e-06, "loss": 0.5229, "step": 11130 }, { "epoch": 22.32, "grad_norm": 68.52033996582031, "learning_rate": 6.9568683341860135e-06, "loss": 0.5771, "step": 11160 }, { "epoch": 22.38, "grad_norm": 42.956085205078125, "learning_rate": 6.942403733156832e-06, "loss": 0.5977, "step": 11190 }, { "epoch": 22.44, "grad_norm": 62.62834548950195, "learning_rate": 6.927919961386984e-06, "loss": 0.5419, "step": 11220 }, { "epoch": 22.5, "grad_norm": 39.22291564941406, "learning_rate": 6.913417161825449e-06, "loss": 0.5346, "step": 11250 }, { "epoch": 22.56, "grad_norm": 21.985593795776367, "learning_rate": 6.898895477609007e-06, "loss": 0.5946, "step": 11280 }, { "epoch": 22.62, "grad_norm": 77.47394561767578, "learning_rate": 6.884355052060814e-06, "loss": 0.5351, "step": 11310 }, { "epoch": 22.68, "grad_norm": 40.48210906982422, "learning_rate": 6.869796028689002e-06, "loss": 0.5245, "step": 11340 }, { "epoch": 22.74, "grad_norm": 33.53753662109375, "learning_rate": 6.8552185511852555e-06, "loss": 0.4837, "step": 11370 }, { "epoch": 22.8, "grad_norm": 68.7355728149414, "learning_rate": 6.840622763423391e-06, "loss": 0.6208, "step": 11400 }, { "epoch": 22.86, "grad_norm": 71.2813720703125, "learning_rate": 6.82600880945794e-06, "loss": 0.6104, "step": 11430 }, { "epoch": 22.92, "grad_norm": 147.4709930419922, "learning_rate": 6.811376833522729e-06, "loss": 0.4831, "step": 11460 }, { "epoch": 22.98, "grad_norm": 79.54974365234375, "learning_rate": 6.796726980029454e-06, "loss": 0.5243, "step": 11490 }, { "epoch": 23.0, "eval_loss": 0.43533027172088623, "eval_map": 0.7183, "eval_map_50": 0.9406, "eval_map_75": 0.86, "eval_map_chicken": 0.7338, "eval_map_duck": 0.6385, "eval_map_large": 0.8416, "eval_map_medium": 0.7236, "eval_map_plant": 0.7827, "eval_map_small": 0.0901, "eval_mar_1": 0.2827, "eval_mar_10": 0.7615, "eval_mar_100": 0.767, "eval_mar_100_chicken": 0.7827, "eval_mar_100_duck": 0.6845, "eval_mar_100_plant": 0.8337, "eval_mar_large": 0.8879, "eval_mar_medium": 0.779, "eval_mar_small": 0.1973, "eval_runtime": 5.0735, "eval_samples_per_second": 19.71, "eval_steps_per_second": 2.562, "step": 11500 }, { "epoch": 23.04, "grad_norm": 42.534297943115234, "learning_rate": 6.782059393566254e-06, "loss": 0.4992, "step": 11520 }, { "epoch": 23.1, "grad_norm": 0.002314250450581312, "learning_rate": 6.767374218896286e-06, "loss": 0.474, "step": 11550 }, { "epoch": 23.16, "grad_norm": 33.95319366455078, "learning_rate": 6.752671600956295e-06, "loss": 0.5098, "step": 11580 }, { "epoch": 23.22, "grad_norm": 65.58226013183594, "learning_rate": 6.737951684855185e-06, "loss": 0.6279, "step": 11610 }, { "epoch": 23.28, "grad_norm": 38.85221481323242, "learning_rate": 6.723214615872585e-06, "loss": 0.5288, "step": 11640 }, { "epoch": 23.34, "grad_norm": 31.03350067138672, "learning_rate": 6.708460539457418e-06, "loss": 0.5167, "step": 11670 }, { "epoch": 23.4, "grad_norm": 74.7662353515625, "learning_rate": 6.693689601226458e-06, "loss": 0.5782, "step": 11700 }, { "epoch": 23.46, "grad_norm": 30.249208450317383, "learning_rate": 6.6789019469629034e-06, "loss": 0.4759, "step": 11730 }, { "epoch": 23.52, "grad_norm": 32.10087966918945, "learning_rate": 6.664097722614934e-06, "loss": 0.4923, "step": 11760 }, { "epoch": 23.58, "grad_norm": 129.60997009277344, "learning_rate": 6.649277074294265e-06, "loss": 0.5149, "step": 11790 }, { "epoch": 23.64, "grad_norm": 74.41838073730469, "learning_rate": 6.634440148274712e-06, "loss": 0.5063, "step": 11820 }, { "epoch": 23.7, "grad_norm": 37.93177032470703, "learning_rate": 6.619587090990748e-06, "loss": 0.4632, "step": 11850 }, { "epoch": 23.76, "grad_norm": 40.77086639404297, "learning_rate": 6.604718049036047e-06, "loss": 0.5137, "step": 11880 }, { "epoch": 23.82, "grad_norm": 29.192161560058594, "learning_rate": 6.589833169162055e-06, "loss": 0.5527, "step": 11910 }, { "epoch": 23.88, "grad_norm": 86.26991271972656, "learning_rate": 6.574932598276524e-06, "loss": 0.4662, "step": 11940 }, { "epoch": 23.94, "grad_norm": 35.82132339477539, "learning_rate": 6.5600164834420754e-06, "loss": 0.5318, "step": 11970 }, { "epoch": 24.0, "grad_norm": 53.413780212402344, "learning_rate": 6.545084971874738e-06, "loss": 0.5184, "step": 12000 }, { "epoch": 24.0, "eval_loss": 0.4076879024505615, "eval_map": 0.7097, "eval_map_50": 0.9464, "eval_map_75": 0.854, "eval_map_chicken": 0.7126, "eval_map_duck": 0.6338, "eval_map_large": 0.8335, "eval_map_medium": 0.7156, "eval_map_plant": 0.7828, "eval_map_small": 0.1197, "eval_mar_1": 0.2741, "eval_mar_10": 0.757, "eval_mar_100": 0.7607, "eval_mar_100_chicken": 0.7667, "eval_mar_100_duck": 0.6784, "eval_mar_100_plant": 0.8372, "eval_mar_large": 0.8828, "eval_mar_medium": 0.7738, "eval_mar_small": 0.2553, "eval_runtime": 4.9733, "eval_samples_per_second": 20.107, "eval_steps_per_second": 2.614, "step": 12000 }, { "epoch": 24.06, "grad_norm": 52.72776412963867, "learning_rate": 6.530138210942505e-06, "loss": 0.5589, "step": 12030 }, { "epoch": 24.12, "grad_norm": 29.438343048095703, "learning_rate": 6.5151763481638705e-06, "loss": 0.5368, "step": 12060 }, { "epoch": 24.18, "grad_norm": 54.32796859741211, "learning_rate": 6.500199531206381e-06, "loss": 0.5092, "step": 12090 }, { "epoch": 24.24, "grad_norm": 69.30450439453125, "learning_rate": 6.485207907885175e-06, "loss": 0.4992, "step": 12120 }, { "epoch": 24.3, "grad_norm": 42.193634033203125, "learning_rate": 6.47020162616152e-06, "loss": 0.4091, "step": 12150 }, { "epoch": 24.36, "grad_norm": 30.120336532592773, "learning_rate": 6.455180834141359e-06, "loss": 0.471, "step": 12180 }, { "epoch": 24.42, "grad_norm": 30.613067626953125, "learning_rate": 6.440145680073847e-06, "loss": 0.5791, "step": 12210 }, { "epoch": 24.48, "grad_norm": 38.11183166503906, "learning_rate": 6.425096312349881e-06, "loss": 0.4348, "step": 12240 }, { "epoch": 24.54, "grad_norm": 46.21797180175781, "learning_rate": 6.410032879500647e-06, "loss": 0.5827, "step": 12270 }, { "epoch": 24.6, "grad_norm": 39.75735855102539, "learning_rate": 6.3949555301961474e-06, "loss": 0.4915, "step": 12300 }, { "epoch": 24.66, "grad_norm": 55.170345306396484, "learning_rate": 6.3798644132437304e-06, "loss": 0.4253, "step": 12330 }, { "epoch": 24.72, "grad_norm": 30.651851654052734, "learning_rate": 6.364759677586627e-06, "loss": 0.5383, "step": 12360 }, { "epoch": 24.78, "grad_norm": 110.5732421875, "learning_rate": 6.349641472302484e-06, "loss": 0.4379, "step": 12390 }, { "epoch": 24.84, "grad_norm": 37.65018081665039, "learning_rate": 6.334509946601879e-06, "loss": 0.4374, "step": 12420 }, { "epoch": 24.9, "grad_norm": 48.68293762207031, "learning_rate": 6.3193652498268656e-06, "loss": 0.5241, "step": 12450 }, { "epoch": 24.96, "grad_norm": 131.17486572265625, "learning_rate": 6.304207531449486e-06, "loss": 0.4849, "step": 12480 }, { "epoch": 25.0, "eval_loss": 0.4043169915676117, "eval_map": 0.7096, "eval_map_50": 0.949, "eval_map_75": 0.8366, "eval_map_chicken": 0.7483, "eval_map_duck": 0.596, "eval_map_large": 0.8412, "eval_map_medium": 0.7084, "eval_map_plant": 0.7843, "eval_map_small": 0.1234, "eval_mar_1": 0.2739, "eval_mar_10": 0.7538, "eval_mar_100": 0.7611, "eval_mar_100_chicken": 0.7902, "eval_mar_100_duck": 0.6546, "eval_mar_100_plant": 0.8383, "eval_mar_large": 0.8891, "eval_mar_medium": 0.7703, "eval_mar_small": 0.258, "eval_runtime": 5.051, "eval_samples_per_second": 19.798, "eval_steps_per_second": 2.574, "step": 12500 }, { "epoch": 25.02, "grad_norm": 204.19046020507812, "learning_rate": 6.2890369410703e-06, "loss": 0.5097, "step": 12510 }, { "epoch": 25.08, "grad_norm": 104.87467956542969, "learning_rate": 6.273853628416911e-06, "loss": 0.507, "step": 12540 }, { "epoch": 25.14, "grad_norm": 32.947471618652344, "learning_rate": 6.258657743342486e-06, "loss": 0.4753, "step": 12570 }, { "epoch": 25.2, "grad_norm": 35.83731460571289, "learning_rate": 6.243449435824276e-06, "loss": 0.4727, "step": 12600 }, { "epoch": 25.26, "grad_norm": 53.04224395751953, "learning_rate": 6.228228855962133e-06, "loss": 0.5548, "step": 12630 }, { "epoch": 25.32, "grad_norm": 35.74001693725586, "learning_rate": 6.212996153977038e-06, "loss": 0.5208, "step": 12660 }, { "epoch": 25.38, "grad_norm": 45.188846588134766, "learning_rate": 6.1977514802096105e-06, "loss": 0.5547, "step": 12690 }, { "epoch": 25.44, "grad_norm": 58.8617057800293, "learning_rate": 6.182494985118625e-06, "loss": 0.4698, "step": 12720 }, { "epoch": 25.5, "grad_norm": 32.76780700683594, "learning_rate": 6.1672268192795285e-06, "loss": 0.5208, "step": 12750 }, { "epoch": 25.56, "grad_norm": 88.9961929321289, "learning_rate": 6.151947133382954e-06, "loss": 0.5717, "step": 12780 }, { "epoch": 25.62, "grad_norm": 51.27913284301758, "learning_rate": 6.136656078233233e-06, "loss": 0.4076, "step": 12810 }, { "epoch": 25.68, "grad_norm": 127.77012634277344, "learning_rate": 6.121353804746907e-06, "loss": 0.5238, "step": 12840 }, { "epoch": 25.74, "grad_norm": 53.242958068847656, "learning_rate": 6.106040463951237e-06, "loss": 0.5165, "step": 12870 }, { "epoch": 25.8, "grad_norm": 91.68648529052734, "learning_rate": 6.090716206982714e-06, "loss": 0.521, "step": 12900 }, { "epoch": 25.86, "grad_norm": 62.1449089050293, "learning_rate": 6.075381185085568e-06, "loss": 0.4903, "step": 12930 }, { "epoch": 25.92, "grad_norm": 0.0003859973221551627, "learning_rate": 6.060035549610275e-06, "loss": 0.4244, "step": 12960 }, { "epoch": 25.98, "grad_norm": 69.36231994628906, "learning_rate": 6.044679452012059e-06, "loss": 0.5022, "step": 12990 }, { "epoch": 26.0, "eval_loss": 0.3883710503578186, "eval_map": 0.7394, "eval_map_50": 0.9528, "eval_map_75": 0.8847, "eval_map_chicken": 0.7466, "eval_map_duck": 0.688, "eval_map_large": 0.8473, "eval_map_medium": 0.7337, "eval_map_plant": 0.7838, "eval_map_small": 0.1472, "eval_mar_1": 0.2918, "eval_mar_10": 0.7816, "eval_mar_100": 0.7876, "eval_mar_100_chicken": 0.7871, "eval_mar_100_duck": 0.7402, "eval_mar_100_plant": 0.8354, "eval_mar_large": 0.8971, "eval_mar_medium": 0.7888, "eval_mar_small": 0.2549, "eval_runtime": 5.5783, "eval_samples_per_second": 17.927, "eval_steps_per_second": 2.33, "step": 13000 }, { "epoch": 26.04, "grad_norm": 39.00455093383789, "learning_rate": 6.029313043849407e-06, "loss": 0.4858, "step": 13020 }, { "epoch": 26.1, "grad_norm": 42.91631317138672, "learning_rate": 6.013936476782563e-06, "loss": 0.573, "step": 13050 }, { "epoch": 26.16, "grad_norm": 87.59916687011719, "learning_rate": 5.9985499025720354e-06, "loss": 0.4353, "step": 13080 }, { "epoch": 26.22, "grad_norm": 25.52212905883789, "learning_rate": 5.9831534730771e-06, "loss": 0.5075, "step": 13110 }, { "epoch": 26.28, "grad_norm": 72.47872161865234, "learning_rate": 5.967747340254303e-06, "loss": 0.5847, "step": 13140 }, { "epoch": 26.34, "grad_norm": 58.947288513183594, "learning_rate": 5.952331656155951e-06, "loss": 0.5281, "step": 13170 }, { "epoch": 26.4, "grad_norm": 110.84516906738281, "learning_rate": 5.936906572928625e-06, "loss": 0.5088, "step": 13200 }, { "epoch": 26.46, "grad_norm": 29.063140869140625, "learning_rate": 5.9214722428116675e-06, "loss": 0.5583, "step": 13230 }, { "epoch": 26.52, "grad_norm": 41.858192443847656, "learning_rate": 5.906028818135687e-06, "loss": 0.4315, "step": 13260 }, { "epoch": 26.58, "grad_norm": 46.3973388671875, "learning_rate": 5.89057645132105e-06, "loss": 0.5034, "step": 13290 }, { "epoch": 26.64, "grad_norm": 57.123966217041016, "learning_rate": 5.8751152948763815e-06, "loss": 0.4648, "step": 13320 }, { "epoch": 26.7, "grad_norm": 36.376487731933594, "learning_rate": 5.859645501397048e-06, "loss": 0.4411, "step": 13350 }, { "epoch": 26.76, "grad_norm": 34.153175354003906, "learning_rate": 5.844167223563669e-06, "loss": 0.7433, "step": 13380 }, { "epoch": 26.82, "grad_norm": 65.91962432861328, "learning_rate": 5.828680614140599e-06, "loss": 0.4586, "step": 13410 }, { "epoch": 26.88, "grad_norm": 30.4884033203125, "learning_rate": 5.813185825974419e-06, "loss": 0.5479, "step": 13440 }, { "epoch": 26.94, "grad_norm": 94.28384399414062, "learning_rate": 5.797683011992432e-06, "loss": 0.6423, "step": 13470 }, { "epoch": 27.0, "grad_norm": 24.540077209472656, "learning_rate": 5.782172325201155e-06, "loss": 0.521, "step": 13500 }, { "epoch": 27.0, "eval_loss": 0.4196639358997345, "eval_map": 0.7177, "eval_map_50": 0.9434, "eval_map_75": 0.8715, "eval_map_chicken": 0.7073, "eval_map_duck": 0.6685, "eval_map_large": 0.8353, "eval_map_medium": 0.7168, "eval_map_plant": 0.7771, "eval_map_small": 0.132, "eval_mar_1": 0.2879, "eval_mar_10": 0.7639, "eval_mar_100": 0.7697, "eval_mar_100_chicken": 0.7649, "eval_mar_100_duck": 0.7165, "eval_mar_100_plant": 0.8277, "eval_mar_large": 0.8799, "eval_mar_medium": 0.7777, "eval_mar_small": 0.2623, "eval_runtime": 5.0566, "eval_samples_per_second": 19.776, "eval_steps_per_second": 2.571, "step": 13500 }, { "epoch": 27.06, "grad_norm": 46.547821044921875, "learning_rate": 5.766653918684803e-06, "loss": 0.4824, "step": 13530 }, { "epoch": 27.12, "grad_norm": 54.376251220703125, "learning_rate": 5.751127945603786e-06, "loss": 0.5959, "step": 13560 }, { "epoch": 27.18, "grad_norm": 42.895103454589844, "learning_rate": 5.735594559193187e-06, "loss": 0.5927, "step": 13590 }, { "epoch": 27.24, "grad_norm": 78.81582641601562, "learning_rate": 5.720053912761261e-06, "loss": 0.4704, "step": 13620 }, { "epoch": 27.3, "grad_norm": 72.24491882324219, "learning_rate": 5.704506159687914e-06, "loss": 0.5529, "step": 13650 }, { "epoch": 27.36, "grad_norm": 61.65352249145508, "learning_rate": 5.68895145342319e-06, "loss": 0.4379, "step": 13680 }, { "epoch": 27.42, "grad_norm": 64.8173828125, "learning_rate": 5.673389947485763e-06, "loss": 0.4938, "step": 13710 }, { "epoch": 27.48, "grad_norm": 35.893592834472656, "learning_rate": 5.657821795461413e-06, "loss": 0.4969, "step": 13740 }, { "epoch": 27.54, "grad_norm": 53.43833923339844, "learning_rate": 5.642247151001515e-06, "loss": 0.6261, "step": 13770 }, { "epoch": 27.6, "grad_norm": 36.205841064453125, "learning_rate": 5.626666167821522e-06, "loss": 0.4915, "step": 13800 }, { "epoch": 27.66, "grad_norm": 49.39502716064453, "learning_rate": 5.611078999699448e-06, "loss": 0.4529, "step": 13830 }, { "epoch": 27.72, "grad_norm": 68.46619415283203, "learning_rate": 5.59548580047435e-06, "loss": 0.573, "step": 13860 }, { "epoch": 27.78, "grad_norm": 99.93022155761719, "learning_rate": 5.5798867240448075e-06, "loss": 0.4234, "step": 13890 }, { "epoch": 27.84, "grad_norm": 41.78444290161133, "learning_rate": 5.5642819243674085e-06, "loss": 0.5215, "step": 13920 }, { "epoch": 27.9, "grad_norm": 65.3072280883789, "learning_rate": 5.548671555455226e-06, "loss": 0.5085, "step": 13950 }, { "epoch": 27.96, "grad_norm": 67.302978515625, "learning_rate": 5.5330557713763e-06, "loss": 0.5433, "step": 13980 }, { "epoch": 28.0, "eval_loss": 0.3886251151561737, "eval_map": 0.7454, "eval_map_50": 0.9508, "eval_map_75": 0.8823, "eval_map_chicken": 0.7573, "eval_map_duck": 0.6941, "eval_map_large": 0.8448, "eval_map_medium": 0.7406, "eval_map_plant": 0.785, "eval_map_small": 0.2083, "eval_mar_1": 0.292, "eval_mar_10": 0.7833, "eval_mar_100": 0.789, "eval_mar_100_chicken": 0.8004, "eval_mar_100_duck": 0.733, "eval_mar_100_plant": 0.8334, "eval_mar_large": 0.8845, "eval_mar_medium": 0.7952, "eval_mar_small": 0.3064, "eval_runtime": 5.0862, "eval_samples_per_second": 19.661, "eval_steps_per_second": 2.556, "step": 14000 }, { "epoch": 28.02, "grad_norm": 50.869449615478516, "learning_rate": 5.517434726252113e-06, "loss": 0.5022, "step": 14010 }, { "epoch": 28.08, "grad_norm": 30.78757095336914, "learning_rate": 5.5018085742560745e-06, "loss": 0.4819, "step": 14040 }, { "epoch": 28.14, "grad_norm": 45.835391998291016, "learning_rate": 5.486177469611999e-06, "loss": 0.5521, "step": 14070 }, { "epoch": 28.2, "grad_norm": 112.30412292480469, "learning_rate": 5.470541566592573e-06, "loss": 0.4874, "step": 14100 }, { "epoch": 28.26, "grad_norm": 61.26950454711914, "learning_rate": 5.454901019517851e-06, "loss": 0.5017, "step": 14130 }, { "epoch": 28.32, "grad_norm": 35.90389633178711, "learning_rate": 5.439255982753717e-06, "loss": 0.5153, "step": 14160 }, { "epoch": 28.38, "grad_norm": 82.97974395751953, "learning_rate": 5.423606610710368e-06, "loss": 0.4807, "step": 14190 }, { "epoch": 28.44, "grad_norm": 24.63577651977539, "learning_rate": 5.4079530578407895e-06, "loss": 0.5761, "step": 14220 }, { "epoch": 28.5, "grad_norm": 70.0156021118164, "learning_rate": 5.392295478639226e-06, "loss": 0.4393, "step": 14250 }, { "epoch": 28.56, "grad_norm": 47.858985900878906, "learning_rate": 5.376634027639664e-06, "loss": 0.4543, "step": 14280 }, { "epoch": 28.62, "grad_norm": 41.32699966430664, "learning_rate": 5.360968859414305e-06, "loss": 0.5178, "step": 14310 }, { "epoch": 28.68, "grad_norm": 38.778343200683594, "learning_rate": 5.345300128572031e-06, "loss": 0.5076, "step": 14340 }, { "epoch": 28.74, "grad_norm": 101.67027282714844, "learning_rate": 5.32962798975689e-06, "loss": 0.4308, "step": 14370 }, { "epoch": 28.8, "grad_norm": 51.669864654541016, "learning_rate": 5.3139525976465675e-06, "loss": 0.4741, "step": 14400 }, { "epoch": 28.86, "grad_norm": 40.283546447753906, "learning_rate": 5.298274106950855e-06, "loss": 0.5707, "step": 14430 }, { "epoch": 28.92, "grad_norm": 124.74097442626953, "learning_rate": 5.282592672410124e-06, "loss": 0.4298, "step": 14460 }, { "epoch": 28.98, "grad_norm": 46.044212341308594, "learning_rate": 5.2669084487938025e-06, "loss": 0.3889, "step": 14490 }, { "epoch": 29.0, "eval_loss": 0.3713254928588867, "eval_map": 0.7492, "eval_map_50": 0.9553, "eval_map_75": 0.8998, "eval_map_chicken": 0.7677, "eval_map_duck": 0.6849, "eval_map_large": 0.8468, "eval_map_medium": 0.7492, "eval_map_plant": 0.7951, "eval_map_small": 0.2224, "eval_mar_1": 0.2891, "eval_mar_10": 0.7873, "eval_mar_100": 0.7936, "eval_mar_100_chicken": 0.8053, "eval_mar_100_duck": 0.7299, "eval_mar_100_plant": 0.8455, "eval_mar_large": 0.8921, "eval_mar_medium": 0.8026, "eval_mar_small": 0.3112, "eval_runtime": 5.3046, "eval_samples_per_second": 18.852, "eval_steps_per_second": 2.451, "step": 14500 }, { "epoch": 29.04, "grad_norm": 28.102954864501953, "learning_rate": 5.251221590898848e-06, "loss": 0.4486, "step": 14520 }, { "epoch": 29.1, "grad_norm": 157.14828491210938, "learning_rate": 5.235532253548213e-06, "loss": 0.5139, "step": 14550 }, { "epoch": 29.16, "grad_norm": 51.68550109863281, "learning_rate": 5.219840591589325e-06, "loss": 0.4739, "step": 14580 }, { "epoch": 29.22, "grad_norm": 54.422359466552734, "learning_rate": 5.204146759892551e-06, "loss": 0.4549, "step": 14610 }, { "epoch": 29.28, "grad_norm": 56.245521545410156, "learning_rate": 5.188450913349674e-06, "loss": 0.4747, "step": 14640 }, { "epoch": 29.34, "grad_norm": 41.02756881713867, "learning_rate": 5.172753206872363e-06, "loss": 0.5289, "step": 14670 }, { "epoch": 29.4, "grad_norm": 37.02859878540039, "learning_rate": 5.157053795390642e-06, "loss": 0.4792, "step": 14700 }, { "epoch": 29.46, "grad_norm": 59.5302619934082, "learning_rate": 5.141352833851367e-06, "loss": 0.4709, "step": 14730 }, { "epoch": 29.52, "grad_norm": 46.878326416015625, "learning_rate": 5.1256504772166885e-06, "loss": 0.5425, "step": 14760 }, { "epoch": 29.58, "grad_norm": 79.3340072631836, "learning_rate": 5.109946880462526e-06, "loss": 0.5793, "step": 14790 }, { "epoch": 29.64, "grad_norm": 65.08154296875, "learning_rate": 5.0942421985770415e-06, "loss": 0.4454, "step": 14820 }, { "epoch": 29.7, "grad_norm": 53.71400833129883, "learning_rate": 5.078536586559104e-06, "loss": 0.4082, "step": 14850 }, { "epoch": 29.76, "grad_norm": 71.08831024169922, "learning_rate": 5.062830199416764e-06, "loss": 0.532, "step": 14880 }, { "epoch": 29.82, "grad_norm": 41.64462661743164, "learning_rate": 5.047123192165722e-06, "loss": 0.4744, "step": 14910 }, { "epoch": 29.88, "grad_norm": 47.789791107177734, "learning_rate": 5.031415719827796e-06, "loss": 0.5136, "step": 14940 }, { "epoch": 29.94, "grad_norm": 76.24413299560547, "learning_rate": 5.015707937429398e-06, "loss": 0.4167, "step": 14970 }, { "epoch": 30.0, "grad_norm": 46.26760482788086, "learning_rate": 5e-06, "loss": 0.5103, "step": 15000 }, { "epoch": 30.0, "eval_loss": 0.35560786724090576, "eval_map": 0.7584, "eval_map_50": 0.9576, "eval_map_75": 0.9014, "eval_map_chicken": 0.7654, "eval_map_duck": 0.7165, "eval_map_large": 0.8517, "eval_map_medium": 0.7509, "eval_map_plant": 0.7934, "eval_map_small": 0.219, "eval_mar_1": 0.2939, "eval_mar_10": 0.7954, "eval_mar_100": 0.8015, "eval_mar_100_chicken": 0.8022, "eval_mar_100_duck": 0.7557, "eval_mar_100_plant": 0.8467, "eval_mar_large": 0.8979, "eval_mar_medium": 0.8078, "eval_mar_small": 0.3089, "eval_runtime": 5.0764, "eval_samples_per_second": 19.699, "eval_steps_per_second": 2.561, "step": 15000 }, { "epoch": 30.06, "grad_norm": 32.46073532104492, "learning_rate": 4.984292062570603e-06, "loss": 0.4897, "step": 15030 }, { "epoch": 30.12, "grad_norm": 60.483089447021484, "learning_rate": 4.968584280172206e-06, "loss": 0.436, "step": 15060 }, { "epoch": 30.18, "grad_norm": 66.74795532226562, "learning_rate": 4.952876807834281e-06, "loss": 0.5319, "step": 15090 }, { "epoch": 30.24, "grad_norm": 72.88277435302734, "learning_rate": 4.937169800583237e-06, "loss": 0.4765, "step": 15120 }, { "epoch": 30.3, "grad_norm": 40.566162109375, "learning_rate": 4.921463413440898e-06, "loss": 0.4799, "step": 15150 }, { "epoch": 30.36, "grad_norm": 65.94972229003906, "learning_rate": 4.90575780142296e-06, "loss": 0.4977, "step": 15180 }, { "epoch": 30.42, "grad_norm": 56.45389175415039, "learning_rate": 4.890053119537475e-06, "loss": 0.4175, "step": 15210 }, { "epoch": 30.48, "grad_norm": 47.09212112426758, "learning_rate": 4.874349522783313e-06, "loss": 0.5274, "step": 15240 }, { "epoch": 30.54, "grad_norm": 145.99957275390625, "learning_rate": 4.8586471661486345e-06, "loss": 0.3792, "step": 15270 }, { "epoch": 30.6, "grad_norm": 86.61822509765625, "learning_rate": 4.842946204609359e-06, "loss": 0.474, "step": 15300 }, { "epoch": 30.66, "grad_norm": 136.17213439941406, "learning_rate": 4.827246793127639e-06, "loss": 0.4006, "step": 15330 }, { "epoch": 30.72, "grad_norm": 35.06562042236328, "learning_rate": 4.811549086650327e-06, "loss": 0.5298, "step": 15360 }, { "epoch": 30.78, "grad_norm": 49.849159240722656, "learning_rate": 4.79585324010745e-06, "loss": 0.5034, "step": 15390 }, { "epoch": 30.84, "grad_norm": 50.45303726196289, "learning_rate": 4.780159408410677e-06, "loss": 0.5148, "step": 15420 }, { "epoch": 30.9, "grad_norm": 94.5147705078125, "learning_rate": 4.7644677464517874e-06, "loss": 0.4116, "step": 15450 }, { "epoch": 30.96, "grad_norm": 32.6632080078125, "learning_rate": 4.748778409101153e-06, "loss": 0.4458, "step": 15480 }, { "epoch": 31.0, "eval_loss": 0.3680790960788727, "eval_map": 0.7355, "eval_map_50": 0.9518, "eval_map_75": 0.8831, "eval_map_chicken": 0.734, "eval_map_duck": 0.6771, "eval_map_large": 0.8569, "eval_map_medium": 0.7311, "eval_map_plant": 0.7955, "eval_map_small": 0.1416, "eval_mar_1": 0.292, "eval_mar_10": 0.7773, "eval_mar_100": 0.7814, "eval_mar_100_chicken": 0.7742, "eval_mar_100_duck": 0.7247, "eval_mar_100_plant": 0.8452, "eval_mar_large": 0.9008, "eval_mar_medium": 0.7892, "eval_mar_small": 0.2358, "eval_runtime": 5.1428, "eval_samples_per_second": 19.445, "eval_steps_per_second": 2.528, "step": 15500 }, { "epoch": 31.02, "grad_norm": 92.16204071044922, "learning_rate": 4.733091551206198e-06, "loss": 0.3926, "step": 15510 }, { "epoch": 31.08, "grad_norm": 75.78022766113281, "learning_rate": 4.717407327589878e-06, "loss": 0.4623, "step": 15540 }, { "epoch": 31.14, "grad_norm": 40.157047271728516, "learning_rate": 4.7017258930491474e-06, "loss": 0.4647, "step": 15570 }, { "epoch": 31.2, "grad_norm": 61.89482498168945, "learning_rate": 4.686047402353433e-06, "loss": 0.4591, "step": 15600 }, { "epoch": 31.26, "grad_norm": 85.72875213623047, "learning_rate": 4.670372010243111e-06, "loss": 0.4529, "step": 15630 }, { "epoch": 31.32, "grad_norm": 69.27102661132812, "learning_rate": 4.654699871427972e-06, "loss": 0.4169, "step": 15660 }, { "epoch": 31.38, "grad_norm": 96.01777648925781, "learning_rate": 4.639031140585697e-06, "loss": 0.4641, "step": 15690 }, { "epoch": 31.44, "grad_norm": 36.54241180419922, "learning_rate": 4.6233659723603374e-06, "loss": 0.4236, "step": 15720 }, { "epoch": 31.5, "grad_norm": 54.6783561706543, "learning_rate": 4.6077045213607765e-06, "loss": 0.4513, "step": 15750 }, { "epoch": 31.56, "grad_norm": 61.09621047973633, "learning_rate": 4.592046942159213e-06, "loss": 0.5054, "step": 15780 }, { "epoch": 31.62, "grad_norm": 47.04421615600586, "learning_rate": 4.576393389289633e-06, "loss": 0.4794, "step": 15810 }, { "epoch": 31.68, "grad_norm": 45.6216926574707, "learning_rate": 4.560744017246284e-06, "loss": 0.4868, "step": 15840 }, { "epoch": 31.74, "grad_norm": 43.895748138427734, "learning_rate": 4.545098980482151e-06, "loss": 0.5823, "step": 15870 }, { "epoch": 31.8, "grad_norm": 68.07852935791016, "learning_rate": 4.529458433407429e-06, "loss": 0.3868, "step": 15900 }, { "epoch": 31.86, "grad_norm": 33.31740951538086, "learning_rate": 4.513822530388004e-06, "loss": 0.6123, "step": 15930 }, { "epoch": 31.92, "grad_norm": 101.1479263305664, "learning_rate": 4.4981914257439254e-06, "loss": 0.4639, "step": 15960 }, { "epoch": 31.98, "grad_norm": 69.75340270996094, "learning_rate": 4.482565273747888e-06, "loss": 0.4369, "step": 15990 }, { "epoch": 32.0, "eval_loss": 0.3522694408893585, "eval_map": 0.7495, "eval_map_50": 0.9499, "eval_map_75": 0.8877, "eval_map_chicken": 0.765, "eval_map_duck": 0.6903, "eval_map_large": 0.8514, "eval_map_medium": 0.7447, "eval_map_plant": 0.7932, "eval_map_small": 0.142, "eval_mar_1": 0.2935, "eval_mar_10": 0.7877, "eval_mar_100": 0.7923, "eval_mar_100_chicken": 0.8027, "eval_mar_100_duck": 0.7309, "eval_mar_100_plant": 0.8432, "eval_mar_large": 0.895, "eval_mar_medium": 0.8026, "eval_mar_small": 0.2589, "eval_runtime": 5.6761, "eval_samples_per_second": 17.618, "eval_steps_per_second": 2.29, "step": 16000 }, { "epoch": 32.04, "grad_norm": 73.68572998046875, "learning_rate": 4.466944228623701e-06, "loss": 0.4943, "step": 16020 }, { "epoch": 32.1, "grad_norm": 59.75843048095703, "learning_rate": 4.451328444544774e-06, "loss": 0.7525, "step": 16050 }, { "epoch": 32.16, "grad_norm": 36.496517181396484, "learning_rate": 4.4357180756325915e-06, "loss": 0.5056, "step": 16080 }, { "epoch": 32.22, "grad_norm": 57.11168670654297, "learning_rate": 4.420113275955193e-06, "loss": 0.4615, "step": 16110 }, { "epoch": 32.28, "grad_norm": 65.62242126464844, "learning_rate": 4.404514199525651e-06, "loss": 0.407, "step": 16140 }, { "epoch": 32.34, "grad_norm": 60.669490814208984, "learning_rate": 4.388921000300553e-06, "loss": 0.548, "step": 16170 }, { "epoch": 32.4, "grad_norm": 79.71160125732422, "learning_rate": 4.373333832178478e-06, "loss": 0.4463, "step": 16200 }, { "epoch": 32.46, "grad_norm": 60.13050842285156, "learning_rate": 4.357752848998486e-06, "loss": 0.4668, "step": 16230 }, { "epoch": 32.52, "grad_norm": 68.18923950195312, "learning_rate": 4.342178204538588e-06, "loss": 0.5161, "step": 16260 }, { "epoch": 32.58, "grad_norm": 39.04051208496094, "learning_rate": 4.326610052514238e-06, "loss": 0.4557, "step": 16290 }, { "epoch": 32.64, "grad_norm": 29.669092178344727, "learning_rate": 4.31104854657681e-06, "loss": 0.4081, "step": 16320 }, { "epoch": 32.7, "grad_norm": 125.63433074951172, "learning_rate": 4.295493840312087e-06, "loss": 0.5007, "step": 16350 }, { "epoch": 32.76, "grad_norm": 65.3372802734375, "learning_rate": 4.279946087238739e-06, "loss": 0.4988, "step": 16380 }, { "epoch": 32.82, "grad_norm": 37.54350662231445, "learning_rate": 4.264405440806813e-06, "loss": 0.4608, "step": 16410 }, { "epoch": 32.88, "grad_norm": 96.40494537353516, "learning_rate": 4.248872054396215e-06, "loss": 0.4581, "step": 16440 }, { "epoch": 32.94, "grad_norm": 47.8939094543457, "learning_rate": 4.233346081315197e-06, "loss": 0.5492, "step": 16470 }, { "epoch": 33.0, "grad_norm": 0.001348652527667582, "learning_rate": 4.217827674798845e-06, "loss": 0.447, "step": 16500 }, { "epoch": 33.0, "eval_loss": 0.3665035367012024, "eval_map": 0.7448, "eval_map_50": 0.954, "eval_map_75": 0.8912, "eval_map_chicken": 0.7453, "eval_map_duck": 0.6933, "eval_map_large": 0.8505, "eval_map_medium": 0.7412, "eval_map_plant": 0.796, "eval_map_small": 0.1577, "eval_mar_1": 0.2922, "eval_mar_10": 0.7844, "eval_mar_100": 0.7879, "eval_mar_100_chicken": 0.7813, "eval_mar_100_duck": 0.7361, "eval_mar_100_plant": 0.8464, "eval_mar_large": 0.8929, "eval_mar_medium": 0.8005, "eval_mar_small": 0.2742, "eval_runtime": 5.1427, "eval_samples_per_second": 19.445, "eval_steps_per_second": 2.528, "step": 16500 }, { "epoch": 33.06, "grad_norm": 50.67320251464844, "learning_rate": 4.202316988007568e-06, "loss": 0.4183, "step": 16530 }, { "epoch": 33.12, "grad_norm": 51.36381149291992, "learning_rate": 4.186814174025582e-06, "loss": 0.4446, "step": 16560 }, { "epoch": 33.18, "grad_norm": 86.76451110839844, "learning_rate": 4.171319385859402e-06, "loss": 0.3794, "step": 16590 }, { "epoch": 33.24, "grad_norm": 82.5096206665039, "learning_rate": 4.155832776436331e-06, "loss": 0.4867, "step": 16620 }, { "epoch": 33.3, "grad_norm": 110.49205780029297, "learning_rate": 4.140354498602952e-06, "loss": 0.454, "step": 16650 }, { "epoch": 33.36, "grad_norm": 29.124536514282227, "learning_rate": 4.124884705123619e-06, "loss": 0.5245, "step": 16680 }, { "epoch": 33.42, "grad_norm": 78.4069595336914, "learning_rate": 4.109423548678949e-06, "loss": 0.4232, "step": 16710 }, { "epoch": 33.48, "grad_norm": 68.84821319580078, "learning_rate": 4.093971181864313e-06, "loss": 0.4485, "step": 16740 }, { "epoch": 33.54, "grad_norm": 91.24239349365234, "learning_rate": 4.078527757188333e-06, "loss": 0.4898, "step": 16770 }, { "epoch": 33.6, "grad_norm": 61.37797546386719, "learning_rate": 4.063093427071376e-06, "loss": 0.6196, "step": 16800 }, { "epoch": 33.66, "grad_norm": 51.44956588745117, "learning_rate": 4.047668343844051e-06, "loss": 0.5473, "step": 16830 }, { "epoch": 33.72, "grad_norm": 80.08527374267578, "learning_rate": 4.032252659745699e-06, "loss": 0.4776, "step": 16860 }, { "epoch": 33.78, "grad_norm": 42.223960876464844, "learning_rate": 4.016846526922901e-06, "loss": 0.5304, "step": 16890 }, { "epoch": 33.84, "grad_norm": 40.85383605957031, "learning_rate": 4.001450097427965e-06, "loss": 0.4721, "step": 16920 }, { "epoch": 33.9, "grad_norm": 25.363073348999023, "learning_rate": 3.986063523217439e-06, "loss": 0.4369, "step": 16950 }, { "epoch": 33.96, "grad_norm": 53.42643737792969, "learning_rate": 3.970686956150595e-06, "loss": 0.4692, "step": 16980 }, { "epoch": 34.0, "eval_loss": 0.3454967439174652, "eval_map": 0.7589, "eval_map_50": 0.954, "eval_map_75": 0.899, "eval_map_chicken": 0.7709, "eval_map_duck": 0.7058, "eval_map_large": 0.863, "eval_map_medium": 0.7459, "eval_map_plant": 0.7999, "eval_map_small": 0.1729, "eval_mar_1": 0.2949, "eval_mar_10": 0.798, "eval_mar_100": 0.8038, "eval_mar_100_chicken": 0.8093, "eval_mar_100_duck": 0.7546, "eval_mar_100_plant": 0.8476, "eval_mar_large": 0.9033, "eval_mar_medium": 0.8068, "eval_mar_small": 0.3123, "eval_runtime": 5.1562, "eval_samples_per_second": 19.394, "eval_steps_per_second": 2.521, "step": 17000 }, { "epoch": 34.02, "grad_norm": 52.77671813964844, "learning_rate": 3.955320547987943e-06, "loss": 0.5145, "step": 17010 }, { "epoch": 34.08, "grad_norm": 59.353485107421875, "learning_rate": 3.939964450389728e-06, "loss": 0.4202, "step": 17040 }, { "epoch": 34.14, "grad_norm": 71.41014099121094, "learning_rate": 3.924618814914435e-06, "loss": 0.4365, "step": 17070 }, { "epoch": 34.2, "grad_norm": 59.05385971069336, "learning_rate": 3.909283793017289e-06, "loss": 0.4725, "step": 17100 }, { "epoch": 34.26, "grad_norm": 74.0579605102539, "learning_rate": 3.8939595360487655e-06, "loss": 0.4601, "step": 17130 }, { "epoch": 34.32, "grad_norm": 26.610624313354492, "learning_rate": 3.8786461952530955e-06, "loss": 0.4415, "step": 17160 }, { "epoch": 34.38, "grad_norm": 97.6423110961914, "learning_rate": 3.863343921766769e-06, "loss": 0.441, "step": 17190 }, { "epoch": 34.44, "grad_norm": 97.2457046508789, "learning_rate": 3.8480528666170495e-06, "loss": 0.4235, "step": 17220 }, { "epoch": 34.5, "grad_norm": 37.252906799316406, "learning_rate": 3.832773180720475e-06, "loss": 0.3976, "step": 17250 }, { "epoch": 34.56, "grad_norm": 37.12264633178711, "learning_rate": 3.817505014881378e-06, "loss": 0.5479, "step": 17280 }, { "epoch": 34.62, "grad_norm": 64.19234466552734, "learning_rate": 3.8022485197903924e-06, "loss": 0.4438, "step": 17310 }, { "epoch": 34.68, "grad_norm": 52.00288009643555, "learning_rate": 3.787003846022964e-06, "loss": 0.4803, "step": 17340 }, { "epoch": 34.74, "grad_norm": 39.877071380615234, "learning_rate": 3.7717711440378695e-06, "loss": 0.51, "step": 17370 }, { "epoch": 34.8, "grad_norm": 62.76517105102539, "learning_rate": 3.756550564175727e-06, "loss": 0.4295, "step": 17400 }, { "epoch": 34.86, "grad_norm": 42.63980484008789, "learning_rate": 3.7413422566575153e-06, "loss": 0.4405, "step": 17430 }, { "epoch": 34.92, "grad_norm": 62.36055374145508, "learning_rate": 3.7261463715830902e-06, "loss": 0.402, "step": 17460 }, { "epoch": 34.98, "grad_norm": 58.33619689941406, "learning_rate": 3.7109630589297014e-06, "loss": 0.4272, "step": 17490 }, { "epoch": 35.0, "eval_loss": 0.3380710482597351, "eval_map": 0.767, "eval_map_50": 0.9568, "eval_map_75": 0.903, "eval_map_chicken": 0.7842, "eval_map_duck": 0.7246, "eval_map_large": 0.852, "eval_map_medium": 0.7623, "eval_map_plant": 0.7922, "eval_map_small": 0.1734, "eval_mar_1": 0.2948, "eval_mar_10": 0.802, "eval_mar_100": 0.8061, "eval_mar_100_chicken": 0.8204, "eval_mar_100_duck": 0.7546, "eval_mar_100_plant": 0.8432, "eval_mar_large": 0.8962, "eval_mar_medium": 0.8136, "eval_mar_small": 0.2907, "eval_runtime": 5.0658, "eval_samples_per_second": 19.74, "eval_steps_per_second": 2.566, "step": 17500 }, { "epoch": 35.04, "grad_norm": 41.134178161621094, "learning_rate": 3.695792468550517e-06, "loss": 0.4129, "step": 17520 }, { "epoch": 35.1, "grad_norm": 25.44190216064453, "learning_rate": 3.680634750173137e-06, "loss": 0.4478, "step": 17550 }, { "epoch": 35.16, "grad_norm": 82.22879028320312, "learning_rate": 3.6654900533981234e-06, "loss": 0.4787, "step": 17580 }, { "epoch": 35.22, "grad_norm": 50.50277328491211, "learning_rate": 3.6503585276975196e-06, "loss": 0.369, "step": 17610 }, { "epoch": 35.28, "grad_norm": 48.85622024536133, "learning_rate": 3.635240322413375e-06, "loss": 0.461, "step": 17640 }, { "epoch": 35.34, "grad_norm": 68.70919799804688, "learning_rate": 3.6201355867562725e-06, "loss": 0.4257, "step": 17670 }, { "epoch": 35.4, "grad_norm": 57.635738372802734, "learning_rate": 3.6050444698038547e-06, "loss": 0.3771, "step": 17700 }, { "epoch": 35.46, "grad_norm": 55.46888732910156, "learning_rate": 3.5899671204993535e-06, "loss": 0.5256, "step": 17730 }, { "epoch": 35.52, "grad_norm": 41.51885986328125, "learning_rate": 3.5749036876501196e-06, "loss": 0.5109, "step": 17760 }, { "epoch": 35.58, "grad_norm": 49.13798904418945, "learning_rate": 3.559854319926156e-06, "loss": 0.4184, "step": 17790 }, { "epoch": 35.64, "grad_norm": 60.9365119934082, "learning_rate": 3.5448191658586423e-06, "loss": 0.4215, "step": 17820 }, { "epoch": 35.7, "grad_norm": 66.89413452148438, "learning_rate": 3.5297983738384813e-06, "loss": 0.5379, "step": 17850 }, { "epoch": 35.76, "grad_norm": 116.77861022949219, "learning_rate": 3.5147920921148267e-06, "loss": 0.4938, "step": 17880 }, { "epoch": 35.82, "grad_norm": 0.00022027752129361033, "learning_rate": 3.49980046879362e-06, "loss": 0.5032, "step": 17910 }, { "epoch": 35.88, "grad_norm": 51.908206939697266, "learning_rate": 3.484823651836131e-06, "loss": 0.4807, "step": 17940 }, { "epoch": 35.94, "grad_norm": 56.6352653503418, "learning_rate": 3.4698617890574972e-06, "loss": 0.4326, "step": 17970 }, { "epoch": 36.0, "grad_norm": 47.75572967529297, "learning_rate": 3.4549150281252635e-06, "loss": 0.4021, "step": 18000 }, { "epoch": 36.0, "eval_loss": 0.3322797417640686, "eval_map": 0.7686, "eval_map_50": 0.9551, "eval_map_75": 0.8938, "eval_map_chicken": 0.7776, "eval_map_duck": 0.7245, "eval_map_large": 0.8616, "eval_map_medium": 0.7621, "eval_map_plant": 0.8038, "eval_map_small": 0.1892, "eval_mar_1": 0.2969, "eval_mar_10": 0.8025, "eval_mar_100": 0.8067, "eval_mar_100_chicken": 0.8133, "eval_mar_100_duck": 0.7577, "eval_mar_100_plant": 0.849, "eval_mar_large": 0.9025, "eval_mar_medium": 0.8122, "eval_mar_small": 0.3049, "eval_runtime": 5.0345, "eval_samples_per_second": 19.863, "eval_steps_per_second": 2.582, "step": 18000 }, { "epoch": 36.06, "grad_norm": 58.42578125, "learning_rate": 3.4399835165579266e-06, "loss": 0.4267, "step": 18030 }, { "epoch": 36.12, "grad_norm": 48.94293212890625, "learning_rate": 3.4250674017234774e-06, "loss": 0.4093, "step": 18060 }, { "epoch": 36.18, "grad_norm": 38.52609634399414, "learning_rate": 3.4101668308379465e-06, "loss": 0.4707, "step": 18090 }, { "epoch": 36.24, "grad_norm": 41.78977584838867, "learning_rate": 3.3952819509639534e-06, "loss": 0.5579, "step": 18120 }, { "epoch": 36.3, "grad_norm": 65.99064636230469, "learning_rate": 3.3804129090092542e-06, "loss": 0.4812, "step": 18150 }, { "epoch": 36.36, "grad_norm": 94.7818603515625, "learning_rate": 3.3655598517252886e-06, "loss": 0.4009, "step": 18180 }, { "epoch": 36.42, "grad_norm": 39.25736999511719, "learning_rate": 3.350722925705736e-06, "loss": 0.4333, "step": 18210 }, { "epoch": 36.48, "grad_norm": 36.73288345336914, "learning_rate": 3.3359022773850673e-06, "loss": 0.4128, "step": 18240 }, { "epoch": 36.54, "grad_norm": 93.98817443847656, "learning_rate": 3.3210980530370974e-06, "loss": 0.41, "step": 18270 }, { "epoch": 36.6, "grad_norm": 49.68222427368164, "learning_rate": 3.3063103987735433e-06, "loss": 0.5326, "step": 18300 }, { "epoch": 36.66, "grad_norm": 41.902557373046875, "learning_rate": 3.2915394605425836e-06, "loss": 0.3922, "step": 18330 }, { "epoch": 36.72, "grad_norm": 88.83726501464844, "learning_rate": 3.2767853841274154e-06, "loss": 0.4792, "step": 18360 }, { "epoch": 36.78, "grad_norm": 33.33390808105469, "learning_rate": 3.262048315144816e-06, "loss": 0.4964, "step": 18390 }, { "epoch": 36.84, "grad_norm": 92.82958984375, "learning_rate": 3.247328399043706e-06, "loss": 0.4358, "step": 18420 }, { "epoch": 36.9, "grad_norm": 63.93076705932617, "learning_rate": 3.2326257811037154e-06, "loss": 0.4057, "step": 18450 }, { "epoch": 36.96, "grad_norm": 74.28779602050781, "learning_rate": 3.217940606433747e-06, "loss": 0.4582, "step": 18480 }, { "epoch": 37.0, "eval_loss": 0.3262586295604706, "eval_map": 0.7732, "eval_map_50": 0.9547, "eval_map_75": 0.9023, "eval_map_chicken": 0.7729, "eval_map_duck": 0.7298, "eval_map_large": 0.8742, "eval_map_medium": 0.7748, "eval_map_plant": 0.817, "eval_map_small": 0.1477, "eval_mar_1": 0.3015, "eval_mar_10": 0.8092, "eval_mar_100": 0.8132, "eval_mar_100_chicken": 0.812, "eval_mar_100_duck": 0.7619, "eval_mar_100_plant": 0.8657, "eval_mar_large": 0.9163, "eval_mar_medium": 0.8251, "eval_mar_small": 0.2634, "eval_runtime": 5.1374, "eval_samples_per_second": 19.465, "eval_steps_per_second": 2.53, "step": 18500 }, { "epoch": 37.02, "grad_norm": 32.50000762939453, "learning_rate": 3.2032730199705477e-06, "loss": 0.438, "step": 18510 }, { "epoch": 37.08, "grad_norm": 59.4605598449707, "learning_rate": 3.188623166477272e-06, "loss": 0.4954, "step": 18540 }, { "epoch": 37.14, "grad_norm": 78.10517120361328, "learning_rate": 3.1739911905420617e-06, "loss": 0.3849, "step": 18570 }, { "epoch": 37.2, "grad_norm": 63.686492919921875, "learning_rate": 3.1593772365766107e-06, "loss": 0.3561, "step": 18600 }, { "epoch": 37.26, "grad_norm": 46.54610061645508, "learning_rate": 3.144781448814746e-06, "loss": 0.4171, "step": 18630 }, { "epoch": 37.32, "grad_norm": 44.2602424621582, "learning_rate": 3.130203971310999e-06, "loss": 0.4487, "step": 18660 }, { "epoch": 37.38, "grad_norm": 100.22451782226562, "learning_rate": 3.1156449479391876e-06, "loss": 0.4211, "step": 18690 }, { "epoch": 37.44, "grad_norm": 71.37747192382812, "learning_rate": 3.1011045223909954e-06, "loss": 0.5317, "step": 18720 }, { "epoch": 37.5, "grad_norm": 0.0002173359098378569, "learning_rate": 3.0865828381745515e-06, "loss": 0.4516, "step": 18750 }, { "epoch": 37.56, "grad_norm": 53.496341705322266, "learning_rate": 3.0720800386130176e-06, "loss": 0.4133, "step": 18780 }, { "epoch": 37.62, "grad_norm": 58.87167739868164, "learning_rate": 3.0575962668431704e-06, "loss": 0.4629, "step": 18810 }, { "epoch": 37.68, "grad_norm": 26.332555770874023, "learning_rate": 3.043131665813988e-06, "loss": 0.4264, "step": 18840 }, { "epoch": 37.74, "grad_norm": 62.68268585205078, "learning_rate": 3.028686378285245e-06, "loss": 0.459, "step": 18870 }, { "epoch": 37.8, "grad_norm": 105.45973205566406, "learning_rate": 3.0142605468260976e-06, "loss": 0.3687, "step": 18900 }, { "epoch": 37.86, "grad_norm": 60.29586410522461, "learning_rate": 2.9998543138136773e-06, "loss": 0.341, "step": 18930 }, { "epoch": 37.92, "grad_norm": 48.2047119140625, "learning_rate": 2.9854678214316875e-06, "loss": 0.3729, "step": 18960 }, { "epoch": 37.98, "grad_norm": 34.51201248168945, "learning_rate": 2.9711012116690007e-06, "loss": 0.3992, "step": 18990 }, { "epoch": 38.0, "eval_loss": 0.3207389712333679, "eval_map": 0.7799, "eval_map_50": 0.956, "eval_map_75": 0.9064, "eval_map_chicken": 0.7833, "eval_map_duck": 0.7384, "eval_map_large": 0.873, "eval_map_medium": 0.7823, "eval_map_plant": 0.818, "eval_map_small": 0.1767, "eval_mar_1": 0.3014, "eval_mar_10": 0.8168, "eval_mar_100": 0.8209, "eval_mar_100_chicken": 0.8218, "eval_mar_100_duck": 0.7732, "eval_mar_100_plant": 0.8677, "eval_mar_large": 0.9172, "eval_mar_medium": 0.8312, "eval_mar_small": 0.3028, "eval_runtime": 5.0908, "eval_samples_per_second": 19.643, "eval_steps_per_second": 2.554, "step": 19000 }, { "epoch": 38.04, "grad_norm": 45.1266975402832, "learning_rate": 2.9567546263182554e-06, "loss": 0.4895, "step": 19020 }, { "epoch": 38.1, "grad_norm": 77.6568374633789, "learning_rate": 2.9424282069744564e-06, "loss": 0.47, "step": 19050 }, { "epoch": 38.16, "grad_norm": 85.21626281738281, "learning_rate": 2.92812209503358e-06, "loss": 0.4005, "step": 19080 }, { "epoch": 38.22, "grad_norm": 62.11589431762695, "learning_rate": 2.9138364316911747e-06, "loss": 0.3894, "step": 19110 }, { "epoch": 38.28, "grad_norm": 50.71180725097656, "learning_rate": 2.899571357940969e-06, "loss": 0.4134, "step": 19140 }, { "epoch": 38.34, "grad_norm": 72.69100952148438, "learning_rate": 2.8853270145734846e-06, "loss": 0.3971, "step": 19170 }, { "epoch": 38.4, "grad_norm": 27.520477294921875, "learning_rate": 2.871103542174637e-06, "loss": 0.3922, "step": 19200 }, { "epoch": 38.46, "grad_norm": 64.30564880371094, "learning_rate": 2.856901081124359e-06, "loss": 0.4765, "step": 19230 }, { "epoch": 38.52, "grad_norm": 54.069091796875, "learning_rate": 2.8427197715952047e-06, "loss": 0.4478, "step": 19260 }, { "epoch": 38.58, "grad_norm": 62.98984146118164, "learning_rate": 2.8285597535509775e-06, "loss": 0.4548, "step": 19290 }, { "epoch": 38.64, "grad_norm": 52.520530700683594, "learning_rate": 2.814421166745337e-06, "loss": 0.529, "step": 19320 }, { "epoch": 38.7, "grad_norm": 71.8565902709961, "learning_rate": 2.800304150720424e-06, "loss": 0.4645, "step": 19350 }, { "epoch": 38.76, "grad_norm": 44.72001266479492, "learning_rate": 2.7862088448054936e-06, "loss": 0.4887, "step": 19380 }, { "epoch": 38.82, "grad_norm": 50.02251052856445, "learning_rate": 2.772135388115519e-06, "loss": 0.4167, "step": 19410 }, { "epoch": 38.88, "grad_norm": 59.54885482788086, "learning_rate": 2.7580839195498397e-06, "loss": 0.393, "step": 19440 }, { "epoch": 38.94, "grad_norm": 72.14510345458984, "learning_rate": 2.7440545777907747e-06, "loss": 0.4157, "step": 19470 }, { "epoch": 39.0, "grad_norm": 117.51093292236328, "learning_rate": 2.7300475013022666e-06, "loss": 0.4286, "step": 19500 }, { "epoch": 39.0, "eval_loss": 0.3193737268447876, "eval_map": 0.7717, "eval_map_50": 0.9567, "eval_map_75": 0.8986, "eval_map_chicken": 0.7752, "eval_map_duck": 0.7223, "eval_map_large": 0.8779, "eval_map_medium": 0.7677, "eval_map_plant": 0.8175, "eval_map_small": 0.1626, "eval_mar_1": 0.3033, "eval_mar_10": 0.8101, "eval_mar_100": 0.8139, "eval_mar_100_chicken": 0.8204, "eval_mar_100_duck": 0.7598, "eval_mar_100_plant": 0.8614, "eval_mar_large": 0.918, "eval_mar_medium": 0.82, "eval_mar_small": 0.2835, "eval_runtime": 5.0222, "eval_samples_per_second": 19.912, "eval_steps_per_second": 2.589, "step": 19500 }, { "epoch": 39.06, "grad_norm": 57.47135925292969, "learning_rate": 2.716062828328502e-06, "loss": 0.4059, "step": 19530 }, { "epoch": 39.12, "grad_norm": 28.567541122436523, "learning_rate": 2.7021006968925613e-06, "loss": 0.4349, "step": 19560 }, { "epoch": 39.18, "grad_norm": 38.38969039916992, "learning_rate": 2.6881612447950425e-06, "loss": 0.3861, "step": 19590 }, { "epoch": 39.24, "grad_norm": 62.003700256347656, "learning_rate": 2.6742446096127086e-06, "loss": 0.3273, "step": 19620 }, { "epoch": 39.3, "grad_norm": 33.330116271972656, "learning_rate": 2.6603509286971342e-06, "loss": 0.478, "step": 19650 }, { "epoch": 39.36, "grad_norm": 102.9520492553711, "learning_rate": 2.646480339173337e-06, "loss": 0.4294, "step": 19680 }, { "epoch": 39.42, "grad_norm": 38.9061393737793, "learning_rate": 2.6326329779384397e-06, "loss": 0.4171, "step": 19710 }, { "epoch": 39.48, "grad_norm": 33.986854553222656, "learning_rate": 2.618808981660304e-06, "loss": 0.487, "step": 19740 }, { "epoch": 39.54, "grad_norm": 2313.75537109375, "learning_rate": 2.6050084867761953e-06, "loss": 0.5018, "step": 19770 }, { "epoch": 39.6, "grad_norm": 40.18400192260742, "learning_rate": 2.5912316294914232e-06, "loss": 0.4993, "step": 19800 }, { "epoch": 39.66, "grad_norm": 58.73672103881836, "learning_rate": 2.5774785457780107e-06, "loss": 0.4466, "step": 19830 }, { "epoch": 39.72, "grad_norm": 113.0173110961914, "learning_rate": 2.5637493713733376e-06, "loss": 0.4275, "step": 19860 }, { "epoch": 39.78, "grad_norm": 62.983646392822266, "learning_rate": 2.5500442417788176e-06, "loss": 0.4815, "step": 19890 }, { "epoch": 39.84, "grad_norm": 41.0040397644043, "learning_rate": 2.536363292258543e-06, "loss": 0.4262, "step": 19920 }, { "epoch": 39.9, "grad_norm": 24.92264175415039, "learning_rate": 2.5227066578379624e-06, "loss": 0.5684, "step": 19950 }, { "epoch": 39.96, "grad_norm": 57.32313537597656, "learning_rate": 2.509074473302546e-06, "loss": 0.4488, "step": 19980 }, { "epoch": 40.0, "eval_loss": 0.3184027671813965, "eval_map": 0.7718, "eval_map_50": 0.9566, "eval_map_75": 0.9047, "eval_map_chicken": 0.7776, "eval_map_duck": 0.7156, "eval_map_large": 0.8809, "eval_map_medium": 0.7702, "eval_map_plant": 0.8223, "eval_map_small": 0.1921, "eval_mar_1": 0.2999, "eval_mar_10": 0.8092, "eval_mar_100": 0.8141, "eval_mar_100_chicken": 0.8187, "eval_mar_100_duck": 0.7546, "eval_mar_100_plant": 0.8689, "eval_mar_large": 0.9192, "eval_mar_medium": 0.8238, "eval_mar_small": 0.3002, "eval_runtime": 5.1382, "eval_samples_per_second": 19.462, "eval_steps_per_second": 2.53, "step": 20000 }, { "epoch": 40.02, "grad_norm": 62.7071533203125, "learning_rate": 2.49546687319645e-06, "loss": 0.4726, "step": 20010 }, { "epoch": 40.08, "grad_norm": 87.53660583496094, "learning_rate": 2.4818839918211963e-06, "loss": 0.3857, "step": 20040 }, { "epoch": 40.14, "grad_norm": 34.03664016723633, "learning_rate": 2.4683259632343363e-06, "loss": 0.3887, "step": 20070 }, { "epoch": 40.2, "grad_norm": 67.48214721679688, "learning_rate": 2.4547929212481436e-06, "loss": 0.4193, "step": 20100 }, { "epoch": 40.26, "grad_norm": 72.2217788696289, "learning_rate": 2.4412849994282744e-06, "loss": 0.4498, "step": 20130 }, { "epoch": 40.32, "grad_norm": 54.74772262573242, "learning_rate": 2.4278023310924676e-06, "loss": 0.4496, "step": 20160 }, { "epoch": 40.38, "grad_norm": 26.028186798095703, "learning_rate": 2.4143450493092146e-06, "loss": 0.4078, "step": 20190 }, { "epoch": 40.44, "grad_norm": 71.3542709350586, "learning_rate": 2.4009132868964525e-06, "loss": 0.5182, "step": 20220 }, { "epoch": 40.5, "grad_norm": 36.26480484008789, "learning_rate": 2.387507176420256e-06, "loss": 0.3948, "step": 20250 }, { "epoch": 40.56, "grad_norm": 61.92445373535156, "learning_rate": 2.3741268501935212e-06, "loss": 0.4554, "step": 20280 }, { "epoch": 40.62, "grad_norm": 85.12369537353516, "learning_rate": 2.3607724402746685e-06, "loss": 0.4314, "step": 20310 }, { "epoch": 40.68, "grad_norm": 42.598114013671875, "learning_rate": 2.3474440784663287e-06, "loss": 0.4402, "step": 20340 }, { "epoch": 40.74, "grad_norm": 29.042329788208008, "learning_rate": 2.334141896314057e-06, "loss": 0.4106, "step": 20370 }, { "epoch": 40.8, "grad_norm": 38.11594772338867, "learning_rate": 2.320866025105016e-06, "loss": 0.4315, "step": 20400 }, { "epoch": 40.86, "grad_norm": 61.246238708496094, "learning_rate": 2.3076165958666992e-06, "loss": 0.3815, "step": 20430 }, { "epoch": 40.92, "grad_norm": 31.141773223876953, "learning_rate": 2.294393739365621e-06, "loss": 0.4318, "step": 20460 }, { "epoch": 40.98, "grad_norm": 45.657249450683594, "learning_rate": 2.281197586106037e-06, "loss": 0.3763, "step": 20490 }, { "epoch": 41.0, "eval_loss": 0.30546829104423523, "eval_map": 0.7876, "eval_map_50": 0.956, "eval_map_75": 0.9186, "eval_map_chicken": 0.7973, "eval_map_duck": 0.7394, "eval_map_large": 0.8844, "eval_map_medium": 0.7824, "eval_map_plant": 0.8262, "eval_map_small": 0.1841, "eval_mar_1": 0.3033, "eval_mar_10": 0.8207, "eval_mar_100": 0.8254, "eval_mar_100_chicken": 0.8356, "eval_mar_100_duck": 0.7691, "eval_mar_100_plant": 0.8715, "eval_mar_large": 0.9234, "eval_mar_medium": 0.8339, "eval_mar_small": 0.3061, "eval_runtime": 5.1002, "eval_samples_per_second": 19.607, "eval_steps_per_second": 2.549, "step": 20500 }, { "epoch": 41.04, "grad_norm": 45.896121978759766, "learning_rate": 2.268028266328655e-06, "loss": 0.4273, "step": 20520 }, { "epoch": 41.1, "grad_norm": 25.360084533691406, "learning_rate": 2.254885910009341e-06, "loss": 0.4682, "step": 20550 }, { "epoch": 41.16, "grad_norm": 63.324825286865234, "learning_rate": 2.2417706468578495e-06, "loss": 0.6033, "step": 20580 }, { "epoch": 41.22, "grad_norm": 129.3037109375, "learning_rate": 2.228682606316529e-06, "loss": 0.5746, "step": 20610 }, { "epoch": 41.28, "grad_norm": 52.51323699951172, "learning_rate": 2.2156219175590623e-06, "loss": 0.4579, "step": 20640 }, { "epoch": 41.34, "grad_norm": 36.566917419433594, "learning_rate": 2.2025887094891657e-06, "loss": 0.4206, "step": 20670 }, { "epoch": 41.4, "grad_norm": 68.68453979492188, "learning_rate": 2.1895831107393485e-06, "loss": 0.4617, "step": 20700 }, { "epoch": 41.46, "grad_norm": 133.7510223388672, "learning_rate": 2.1766052496696155e-06, "loss": 0.5263, "step": 20730 }, { "epoch": 41.52, "grad_norm": 76.5693130493164, "learning_rate": 2.1636552543662187e-06, "loss": 0.4473, "step": 20760 }, { "epoch": 41.58, "grad_norm": 60.44133377075195, "learning_rate": 2.1507332526403814e-06, "loss": 0.4135, "step": 20790 }, { "epoch": 41.64, "grad_norm": 117.59391021728516, "learning_rate": 2.137839372027047e-06, "loss": 0.4654, "step": 20820 }, { "epoch": 41.7, "grad_norm": 45.36744689941406, "learning_rate": 2.124973739783609e-06, "loss": 0.4071, "step": 20850 }, { "epoch": 41.76, "grad_norm": 57.2125358581543, "learning_rate": 2.112136482888663e-06, "loss": 0.3865, "step": 20880 }, { "epoch": 41.82, "grad_norm": 60.10706329345703, "learning_rate": 2.0993277280407547e-06, "loss": 0.4395, "step": 20910 }, { "epoch": 41.88, "grad_norm": 76.14381408691406, "learning_rate": 2.0865476016571206e-06, "loss": 0.4623, "step": 20940 }, { "epoch": 41.94, "grad_norm": 47.56647491455078, "learning_rate": 2.0737962298724513e-06, "loss": 0.3841, "step": 20970 }, { "epoch": 42.0, "grad_norm": 85.08351135253906, "learning_rate": 2.061073738537635e-06, "loss": 0.5658, "step": 21000 }, { "epoch": 42.0, "eval_loss": 0.30137816071510315, "eval_map": 0.791, "eval_map_50": 0.9594, "eval_map_75": 0.9167, "eval_map_chicken": 0.805, "eval_map_duck": 0.7421, "eval_map_large": 0.8786, "eval_map_medium": 0.7911, "eval_map_plant": 0.8259, "eval_map_small": 0.2095, "eval_mar_1": 0.3032, "eval_mar_10": 0.8244, "eval_mar_100": 0.8299, "eval_mar_100_chicken": 0.8404, "eval_mar_100_duck": 0.7742, "eval_mar_100_plant": 0.8749, "eval_mar_large": 0.9213, "eval_mar_medium": 0.8403, "eval_mar_small": 0.3403, "eval_runtime": 5.0741, "eval_samples_per_second": 19.708, "eval_steps_per_second": 2.562, "step": 21000 }, { "epoch": 42.06, "grad_norm": 41.583213806152344, "learning_rate": 2.0483802532185286e-06, "loss": 0.4022, "step": 21030 }, { "epoch": 42.12, "grad_norm": 320.62518310546875, "learning_rate": 2.035715899194704e-06, "loss": 0.4408, "step": 21060 }, { "epoch": 42.18, "grad_norm": 42.51158142089844, "learning_rate": 2.0230808014582265e-06, "loss": 0.4566, "step": 21090 }, { "epoch": 42.24, "grad_norm": 0.00034786213655024767, "learning_rate": 2.0104750847124075e-06, "loss": 0.5319, "step": 21120 }, { "epoch": 42.3, "grad_norm": 93.6717529296875, "learning_rate": 1.9978988733705807e-06, "loss": 0.4083, "step": 21150 }, { "epoch": 42.36, "grad_norm": 52.52644348144531, "learning_rate": 1.9853522915548777e-06, "loss": 0.4354, "step": 21180 }, { "epoch": 42.42, "grad_norm": 36.161460876464844, "learning_rate": 1.9728354630949935e-06, "loss": 0.4591, "step": 21210 }, { "epoch": 42.48, "grad_norm": 60.393306732177734, "learning_rate": 1.9603485115269743e-06, "loss": 0.5063, "step": 21240 }, { "epoch": 42.54, "grad_norm": 223.328857421875, "learning_rate": 1.9478915600919877e-06, "loss": 0.4404, "step": 21270 }, { "epoch": 42.6, "grad_norm": 42.48649215698242, "learning_rate": 1.9354647317351187e-06, "loss": 0.4508, "step": 21300 }, { "epoch": 42.66, "grad_norm": 46.062191009521484, "learning_rate": 1.9230681491041425e-06, "loss": 0.4275, "step": 21330 }, { "epoch": 42.72, "grad_norm": 0.0008085273439064622, "learning_rate": 1.910701934548329e-06, "loss": 0.4588, "step": 21360 }, { "epoch": 42.78, "grad_norm": 44.36118698120117, "learning_rate": 1.8983662101172217e-06, "loss": 0.4563, "step": 21390 }, { "epoch": 42.84, "grad_norm": 139.61676025390625, "learning_rate": 1.8860610975594384e-06, "loss": 0.3606, "step": 21420 }, { "epoch": 42.9, "grad_norm": 37.38964080810547, "learning_rate": 1.873786718321476e-06, "loss": 0.4464, "step": 21450 }, { "epoch": 42.96, "grad_norm": 72.3614730834961, "learning_rate": 1.8615431935464984e-06, "loss": 0.4322, "step": 21480 }, { "epoch": 43.0, "eval_loss": 0.29740211367607117, "eval_map": 0.7974, "eval_map_50": 0.9595, "eval_map_75": 0.9169, "eval_map_chicken": 0.8005, "eval_map_duck": 0.7586, "eval_map_large": 0.8951, "eval_map_medium": 0.7927, "eval_map_plant": 0.8331, "eval_map_small": 0.1879, "eval_mar_1": 0.3078, "eval_mar_10": 0.8296, "eval_mar_100": 0.834, "eval_mar_100_chicken": 0.8369, "eval_mar_100_duck": 0.7876, "eval_mar_100_plant": 0.8775, "eval_mar_large": 0.931, "eval_mar_medium": 0.8411, "eval_mar_small": 0.3085, "eval_runtime": 5.6419, "eval_samples_per_second": 17.724, "eval_steps_per_second": 2.304, "step": 21500 }, { "epoch": 43.02, "grad_norm": 44.15309143066406, "learning_rate": 1.8493306440731557e-06, "loss": 0.4896, "step": 21510 }, { "epoch": 43.08, "grad_norm": 35.48102951049805, "learning_rate": 1.837149190434378e-06, "loss": 0.5013, "step": 21540 }, { "epoch": 43.14, "grad_norm": 35.87041473388672, "learning_rate": 1.824998952856198e-06, "loss": 0.4439, "step": 21570 }, { "epoch": 43.2, "grad_norm": 26.650522232055664, "learning_rate": 1.8128800512565514e-06, "loss": 0.4186, "step": 21600 }, { "epoch": 43.26, "grad_norm": 48.30433654785156, "learning_rate": 1.800792605244109e-06, "loss": 0.4345, "step": 21630 }, { "epoch": 43.32, "grad_norm": 70.63233184814453, "learning_rate": 1.7887367341170781e-06, "loss": 0.4639, "step": 21660 }, { "epoch": 43.38, "grad_norm": 29.950109481811523, "learning_rate": 1.7767125568620442e-06, "loss": 0.3931, "step": 21690 }, { "epoch": 43.44, "grad_norm": 40.98532485961914, "learning_rate": 1.7647201921527802e-06, "loss": 0.3728, "step": 21720 }, { "epoch": 43.5, "grad_norm": 107.21430969238281, "learning_rate": 1.7527597583490825e-06, "loss": 0.3679, "step": 21750 }, { "epoch": 43.56, "grad_norm": 41.53556442260742, "learning_rate": 1.7408313734956074e-06, "loss": 0.4278, "step": 21780 }, { "epoch": 43.62, "grad_norm": 30.475116729736328, "learning_rate": 1.7289351553206952e-06, "loss": 0.4995, "step": 21810 }, { "epoch": 43.68, "grad_norm": 65.69325256347656, "learning_rate": 1.7170712212352187e-06, "loss": 0.4236, "step": 21840 }, { "epoch": 43.74, "grad_norm": 83.24858856201172, "learning_rate": 1.7052396883314154e-06, "loss": 0.4865, "step": 21870 }, { "epoch": 43.8, "grad_norm": 49.75985336303711, "learning_rate": 1.6934406733817417e-06, "loss": 0.4061, "step": 21900 }, { "epoch": 43.86, "grad_norm": 0.0012297651264816523, "learning_rate": 1.6816742928377072e-06, "loss": 0.4391, "step": 21930 }, { "epoch": 43.92, "grad_norm": 107.39283752441406, "learning_rate": 1.6699406628287423e-06, "loss": 0.4027, "step": 21960 }, { "epoch": 43.98, "grad_norm": 53.299110412597656, "learning_rate": 1.658239899161036e-06, "loss": 0.7057, "step": 21990 }, { "epoch": 44.0, "eval_loss": 0.3092344403266907, "eval_map": 0.7822, "eval_map_50": 0.9563, "eval_map_75": 0.9171, "eval_map_chicken": 0.7941, "eval_map_duck": 0.7348, "eval_map_large": 0.8688, "eval_map_medium": 0.7813, "eval_map_plant": 0.8177, "eval_map_small": 0.1985, "eval_mar_1": 0.3003, "eval_mar_10": 0.8165, "eval_mar_100": 0.821, "eval_mar_100_chicken": 0.8307, "eval_mar_100_duck": 0.766, "eval_mar_100_plant": 0.8663, "eval_mar_large": 0.9117, "eval_mar_medium": 0.8292, "eval_mar_small": 0.3663, "eval_runtime": 5.0773, "eval_samples_per_second": 19.696, "eval_steps_per_second": 2.56, "step": 22000 }, { "epoch": 44.04, "grad_norm": 42.234928131103516, "learning_rate": 1.6465721173164e-06, "loss": 0.4139, "step": 22020 }, { "epoch": 44.1, "grad_norm": 57.58454513549805, "learning_rate": 1.6349374324511347e-06, "loss": 0.4395, "step": 22050 }, { "epoch": 44.16, "grad_norm": 57.831993103027344, "learning_rate": 1.6233359593948777e-06, "loss": 0.4128, "step": 22080 }, { "epoch": 44.22, "grad_norm": 57.68543243408203, "learning_rate": 1.6117678126494895e-06, "loss": 0.4225, "step": 22110 }, { "epoch": 44.28, "grad_norm": 168.56692504882812, "learning_rate": 1.600233106387904e-06, "loss": 0.423, "step": 22140 }, { "epoch": 44.34, "grad_norm": 39.12761306762695, "learning_rate": 1.5887319544530182e-06, "loss": 0.3617, "step": 22170 }, { "epoch": 44.4, "grad_norm": 41.760311126708984, "learning_rate": 1.5772644703565564e-06, "loss": 0.6029, "step": 22200 }, { "epoch": 44.46, "grad_norm": 79.56449127197266, "learning_rate": 1.5658307672779594e-06, "loss": 0.3154, "step": 22230 }, { "epoch": 44.52, "grad_norm": 35.965431213378906, "learning_rate": 1.554430958063259e-06, "loss": 0.4407, "step": 22260 }, { "epoch": 44.58, "grad_norm": 54.796878814697266, "learning_rate": 1.5430651552239684e-06, "loss": 0.4, "step": 22290 }, { "epoch": 44.64, "grad_norm": 64.1689682006836, "learning_rate": 1.531733470935976e-06, "loss": 0.4755, "step": 22320 }, { "epoch": 44.7, "grad_norm": 36.782920837402344, "learning_rate": 1.5204360170384286e-06, "loss": 0.4451, "step": 22350 }, { "epoch": 44.76, "grad_norm": 38.28982162475586, "learning_rate": 1.5091729050326376e-06, "loss": 0.4116, "step": 22380 }, { "epoch": 44.82, "grad_norm": 36.69734191894531, "learning_rate": 1.4979442460809684e-06, "loss": 0.4304, "step": 22410 }, { "epoch": 44.88, "grad_norm": 34.10408020019531, "learning_rate": 1.4867501510057548e-06, "loss": 0.4208, "step": 22440 }, { "epoch": 44.94, "grad_norm": 56.05753707885742, "learning_rate": 1.4755907302881927e-06, "loss": 0.4207, "step": 22470 }, { "epoch": 45.0, "grad_norm": 79.50679779052734, "learning_rate": 1.4644660940672628e-06, "loss": 0.4096, "step": 22500 }, { "epoch": 45.0, "eval_loss": 0.29910051822662354, "eval_map": 0.7899, "eval_map_50": 0.9614, "eval_map_75": 0.9121, "eval_map_chicken": 0.8016, "eval_map_duck": 0.7502, "eval_map_large": 0.8747, "eval_map_medium": 0.7852, "eval_map_plant": 0.8179, "eval_map_small": 0.2212, "eval_mar_1": 0.3031, "eval_mar_10": 0.8233, "eval_mar_100": 0.8286, "eval_mar_100_chicken": 0.8413, "eval_mar_100_duck": 0.7794, "eval_mar_100_plant": 0.8651, "eval_mar_large": 0.9142, "eval_mar_medium": 0.8351, "eval_mar_small": 0.3578, "eval_runtime": 5.1133, "eval_samples_per_second": 19.557, "eval_steps_per_second": 2.542, "step": 22500 }, { "epoch": 45.06, "grad_norm": 38.6081428527832, "learning_rate": 1.4533763521386319e-06, "loss": 0.392, "step": 22530 }, { "epoch": 45.12, "grad_norm": 28.41141128540039, "learning_rate": 1.4423216139535735e-06, "loss": 0.4145, "step": 22560 }, { "epoch": 45.18, "grad_norm": 91.0741195678711, "learning_rate": 1.4313019886178942e-06, "loss": 0.4022, "step": 22590 }, { "epoch": 45.24, "grad_norm": 88.55020141601562, "learning_rate": 1.420317584890844e-06, "loss": 0.5098, "step": 22620 }, { "epoch": 45.3, "grad_norm": 59.97364044189453, "learning_rate": 1.4093685111840567e-06, "loss": 0.4416, "step": 22650 }, { "epoch": 45.36, "grad_norm": 138.7408447265625, "learning_rate": 1.3984548755604655e-06, "loss": 0.4223, "step": 22680 }, { "epoch": 45.42, "grad_norm": 41.95036315917969, "learning_rate": 1.3875767857332512e-06, "loss": 0.4241, "step": 22710 }, { "epoch": 45.48, "grad_norm": 35.16947937011719, "learning_rate": 1.3767343490647668e-06, "loss": 0.4442, "step": 22740 }, { "epoch": 45.54, "grad_norm": 69.71556091308594, "learning_rate": 1.3659276725654863e-06, "loss": 0.3552, "step": 22770 }, { "epoch": 45.6, "grad_norm": 95.909423828125, "learning_rate": 1.3551568628929434e-06, "loss": 0.4363, "step": 22800 }, { "epoch": 45.66, "grad_norm": 21.66033935546875, "learning_rate": 1.3444220263506797e-06, "loss": 0.4363, "step": 22830 }, { "epoch": 45.72, "grad_norm": 131.8041229248047, "learning_rate": 1.333723268887201e-06, "loss": 0.4592, "step": 22860 }, { "epoch": 45.78, "grad_norm": 50.998779296875, "learning_rate": 1.3230606960949204e-06, "loss": 0.4649, "step": 22890 }, { "epoch": 45.84, "grad_norm": 29.139339447021484, "learning_rate": 1.312434413209131e-06, "loss": 0.4568, "step": 22920 }, { "epoch": 45.9, "grad_norm": 51.54317092895508, "learning_rate": 1.301844525106951e-06, "loss": 0.4308, "step": 22950 }, { "epoch": 45.96, "grad_norm": 46.99152374267578, "learning_rate": 1.2912911363063048e-06, "loss": 0.4854, "step": 22980 }, { "epoch": 46.0, "eval_loss": 0.3003343343734741, "eval_map": 0.7815, "eval_map_50": 0.9595, "eval_map_75": 0.9068, "eval_map_chicken": 0.7816, "eval_map_duck": 0.746, "eval_map_large": 0.8747, "eval_map_medium": 0.7791, "eval_map_plant": 0.8169, "eval_map_small": 0.2042, "eval_mar_1": 0.3016, "eval_mar_10": 0.8164, "eval_mar_100": 0.8197, "eval_mar_100_chicken": 0.8231, "eval_mar_100_duck": 0.7722, "eval_mar_100_plant": 0.8637, "eval_mar_large": 0.9163, "eval_mar_medium": 0.8255, "eval_mar_small": 0.3258, "eval_runtime": 5.0277, "eval_samples_per_second": 19.89, "eval_steps_per_second": 2.586, "step": 23000 }, { "epoch": 46.02, "grad_norm": 82.24079132080078, "learning_rate": 1.2807743509648745e-06, "loss": 0.459, "step": 23010 }, { "epoch": 46.08, "grad_norm": 35.353336334228516, "learning_rate": 1.2702942728790897e-06, "loss": 0.4215, "step": 23040 }, { "epoch": 46.14, "grad_norm": 38.322479248046875, "learning_rate": 1.2598510054830888e-06, "loss": 0.3925, "step": 23070 }, { "epoch": 46.2, "grad_norm": 53.787445068359375, "learning_rate": 1.2494446518477022e-06, "loss": 0.349, "step": 23100 }, { "epoch": 46.26, "grad_norm": 37.92025375366211, "learning_rate": 1.2390753146794438e-06, "loss": 0.3578, "step": 23130 }, { "epoch": 46.32, "grad_norm": 68.19427490234375, "learning_rate": 1.2287430963194807e-06, "loss": 0.4342, "step": 23160 }, { "epoch": 46.38, "grad_norm": 108.89007568359375, "learning_rate": 1.218448098742641e-06, "loss": 0.4607, "step": 23190 }, { "epoch": 46.44, "grad_norm": 83.83390808105469, "learning_rate": 1.2081904235563908e-06, "loss": 0.4169, "step": 23220 }, { "epoch": 46.5, "grad_norm": 46.47811508178711, "learning_rate": 1.1979701719998454e-06, "loss": 0.3965, "step": 23250 }, { "epoch": 46.56, "grad_norm": 83.35205841064453, "learning_rate": 1.18778744494276e-06, "loss": 0.685, "step": 23280 }, { "epoch": 46.62, "grad_norm": 61.895530700683594, "learning_rate": 1.1776423428845423e-06, "loss": 0.3723, "step": 23310 }, { "epoch": 46.68, "grad_norm": 68.6615982055664, "learning_rate": 1.1675349659532514e-06, "loss": 0.4277, "step": 23340 }, { "epoch": 46.74, "grad_norm": 34.00867462158203, "learning_rate": 1.1574654139046171e-06, "loss": 0.4321, "step": 23370 }, { "epoch": 46.8, "grad_norm": 40.27052688598633, "learning_rate": 1.1474337861210543e-06, "loss": 0.3798, "step": 23400 }, { "epoch": 46.86, "grad_norm": 58.309085845947266, "learning_rate": 1.1374401816106778e-06, "loss": 0.4083, "step": 23430 }, { "epoch": 46.92, "grad_norm": 43.79540252685547, "learning_rate": 1.1274846990063314e-06, "loss": 0.3961, "step": 23460 }, { "epoch": 46.98, "grad_norm": 48.5699462890625, "learning_rate": 1.1175674365646067e-06, "loss": 0.4257, "step": 23490 }, { "epoch": 47.0, "eval_loss": 0.29506856203079224, "eval_map": 0.792, "eval_map_50": 0.9625, "eval_map_75": 0.9172, "eval_map_chicken": 0.7961, "eval_map_duck": 0.7572, "eval_map_large": 0.8802, "eval_map_medium": 0.7855, "eval_map_plant": 0.8226, "eval_map_small": 0.2075, "eval_mar_1": 0.3067, "eval_mar_10": 0.8262, "eval_mar_100": 0.8309, "eval_mar_100_chicken": 0.8338, "eval_mar_100_duck": 0.7907, "eval_mar_100_plant": 0.8683, "eval_mar_large": 0.9197, "eval_mar_medium": 0.836, "eval_mar_small": 0.3468, "eval_runtime": 5.0742, "eval_samples_per_second": 19.708, "eval_steps_per_second": 2.562, "step": 23500 }, { "epoch": 47.04, "grad_norm": 61.57620620727539, "learning_rate": 1.1076884921648834e-06, "loss": 0.3394, "step": 23520 }, { "epoch": 47.1, "grad_norm": 46.27333450317383, "learning_rate": 1.097847963308351e-06, "loss": 0.4013, "step": 23550 }, { "epoch": 47.16, "grad_norm": 75.60147857666016, "learning_rate": 1.0880459471170597e-06, "loss": 0.337, "step": 23580 }, { "epoch": 47.22, "grad_norm": 41.4156608581543, "learning_rate": 1.0782825403329488e-06, "loss": 0.3904, "step": 23610 }, { "epoch": 47.28, "grad_norm": 35.6782341003418, "learning_rate": 1.0685578393169054e-06, "loss": 0.4262, "step": 23640 }, { "epoch": 47.34, "grad_norm": 34.51017761230469, "learning_rate": 1.0588719400478004e-06, "loss": 0.4002, "step": 23670 }, { "epoch": 47.4, "grad_norm": 33.08877944946289, "learning_rate": 1.049224938121548e-06, "loss": 0.4203, "step": 23700 }, { "epoch": 47.46, "grad_norm": 32.152339935302734, "learning_rate": 1.0396169287501652e-06, "loss": 0.3937, "step": 23730 }, { "epoch": 47.52, "grad_norm": 53.18661117553711, "learning_rate": 1.0300480067608232e-06, "loss": 0.4445, "step": 23760 }, { "epoch": 47.58, "grad_norm": 40.39225387573242, "learning_rate": 1.020518266594921e-06, "loss": 0.4166, "step": 23790 }, { "epoch": 47.64, "grad_norm": 42.8251838684082, "learning_rate": 1.0110278023071445e-06, "loss": 0.414, "step": 23820 }, { "epoch": 47.7, "grad_norm": 64.0047607421875, "learning_rate": 1.0015767075645472e-06, "loss": 0.328, "step": 23850 }, { "epoch": 47.76, "grad_norm": 52.580780029296875, "learning_rate": 9.921650756456164e-07, "loss": 0.4109, "step": 23880 }, { "epoch": 47.82, "grad_norm": 59.67039489746094, "learning_rate": 9.82792999439362e-07, "loss": 0.4171, "step": 23910 }, { "epoch": 47.88, "grad_norm": 179.34124755859375, "learning_rate": 9.734605714443906e-07, "loss": 0.4743, "step": 23940 }, { "epoch": 47.94, "grad_norm": 53.743431091308594, "learning_rate": 9.641678837679985e-07, "loss": 0.4152, "step": 23970 }, { "epoch": 48.0, "grad_norm": 46.56321716308594, "learning_rate": 9.549150281252633e-07, "loss": 0.4033, "step": 24000 }, { "epoch": 48.0, "eval_loss": 0.28829237818717957, "eval_map": 0.7988, "eval_map_50": 0.9632, "eval_map_75": 0.9194, "eval_map_chicken": 0.8069, "eval_map_duck": 0.7649, "eval_map_large": 0.8765, "eval_map_medium": 0.7984, "eval_map_plant": 0.8246, "eval_map_small": 0.2266, "eval_mar_1": 0.3082, "eval_mar_10": 0.8343, "eval_mar_100": 0.8382, "eval_mar_100_chicken": 0.8458, "eval_mar_100_duck": 0.7969, "eval_mar_100_plant": 0.872, "eval_mar_large": 0.9176, "eval_mar_medium": 0.8477, "eval_mar_small": 0.3616, "eval_runtime": 5.0852, "eval_samples_per_second": 19.665, "eval_steps_per_second": 2.556, "step": 24000 }, { "epoch": 48.06, "grad_norm": 33.844398498535156, "learning_rate": 9.457020958381324e-07, "loss": 0.3829, "step": 24030 }, { "epoch": 48.12, "grad_norm": 75.94850158691406, "learning_rate": 9.365291778345303e-07, "loss": 0.4371, "step": 24060 }, { "epoch": 48.18, "grad_norm": 40.99359893798828, "learning_rate": 9.273963646474527e-07, "loss": 0.456, "step": 24090 }, { "epoch": 48.24, "grad_norm": 57.59867477416992, "learning_rate": 9.183037464140804e-07, "loss": 0.4523, "step": 24120 }, { "epoch": 48.3, "grad_norm": 142.89874267578125, "learning_rate": 9.09251412874882e-07, "loss": 0.3649, "step": 24150 }, { "epoch": 48.36, "grad_norm": 67.51494598388672, "learning_rate": 9.002394533727382e-07, "loss": 0.4477, "step": 24180 }, { "epoch": 48.42, "grad_norm": 82.09522247314453, "learning_rate": 8.912679568520494e-07, "loss": 0.4224, "step": 24210 }, { "epoch": 48.48, "grad_norm": 54.342594146728516, "learning_rate": 8.823370118578628e-07, "loss": 0.4375, "step": 24240 }, { "epoch": 48.54, "grad_norm": 137.6064910888672, "learning_rate": 8.734467065350022e-07, "loss": 0.4574, "step": 24270 }, { "epoch": 48.6, "grad_norm": 64.60173797607422, "learning_rate": 8.645971286271903e-07, "loss": 0.4518, "step": 24300 }, { "epoch": 48.66, "grad_norm": 45.69334411621094, "learning_rate": 8.557883654761906e-07, "loss": 0.404, "step": 24330 }, { "epoch": 48.72, "grad_norm": 179.41268920898438, "learning_rate": 8.470205040209362e-07, "loss": 0.4592, "step": 24360 }, { "epoch": 48.78, "grad_norm": 52.23598098754883, "learning_rate": 8.382936307966838e-07, "loss": 0.4067, "step": 24390 }, { "epoch": 48.84, "grad_norm": 73.33792114257812, "learning_rate": 8.296078319341444e-07, "loss": 0.4185, "step": 24420 }, { "epoch": 48.9, "grad_norm": 78.52240753173828, "learning_rate": 8.209631931586499e-07, "loss": 0.3914, "step": 24450 }, { "epoch": 48.96, "grad_norm": 59.30632781982422, "learning_rate": 8.123597997892918e-07, "loss": 0.4932, "step": 24480 }, { "epoch": 49.0, "eval_loss": 0.3021915555000305, "eval_map": 0.7844, "eval_map_50": 0.9617, "eval_map_75": 0.9101, "eval_map_chicken": 0.7882, "eval_map_duck": 0.7472, "eval_map_large": 0.8762, "eval_map_medium": 0.7765, "eval_map_plant": 0.8177, "eval_map_small": 0.2231, "eval_mar_1": 0.3007, "eval_mar_10": 0.8216, "eval_mar_100": 0.8252, "eval_mar_100_chicken": 0.8293, "eval_mar_100_duck": 0.7794, "eval_mar_100_plant": 0.8669, "eval_mar_large": 0.9176, "eval_mar_medium": 0.8308, "eval_mar_small": 0.3396, "eval_runtime": 5.0276, "eval_samples_per_second": 19.89, "eval_steps_per_second": 2.586, "step": 24500 }, { "epoch": 49.02, "grad_norm": 119.42558288574219, "learning_rate": 8.037977367380922e-07, "loss": 0.4811, "step": 24510 }, { "epoch": 49.08, "grad_norm": 0.00024352494801860303, "learning_rate": 7.952770885091548e-07, "loss": 0.3779, "step": 24540 }, { "epoch": 49.14, "grad_norm": 67.42436981201172, "learning_rate": 7.867979391978398e-07, "loss": 0.3558, "step": 24570 }, { "epoch": 49.2, "grad_norm": 92.31123352050781, "learning_rate": 7.783603724899258e-07, "loss": 0.4426, "step": 24600 }, { "epoch": 49.26, "grad_norm": 48.806907653808594, "learning_rate": 7.699644716607896e-07, "loss": 0.3877, "step": 24630 }, { "epoch": 49.32, "grad_norm": 27.726848602294922, "learning_rate": 7.61610319574585e-07, "loss": 0.3929, "step": 24660 }, { "epoch": 49.38, "grad_norm": 50.71929168701172, "learning_rate": 7.532979986834177e-07, "loss": 0.3916, "step": 24690 }, { "epoch": 49.44, "grad_norm": 38.81157684326172, "learning_rate": 7.450275910265415e-07, "loss": 0.3922, "step": 24720 }, { "epoch": 49.5, "grad_norm": 52.464599609375, "learning_rate": 7.367991782295392e-07, "loss": 0.4487, "step": 24750 }, { "epoch": 49.56, "grad_norm": 48.69332504272461, "learning_rate": 7.286128415035249e-07, "loss": 0.4287, "step": 24780 }, { "epoch": 49.62, "grad_norm": 50.46269226074219, "learning_rate": 7.204686616443352e-07, "loss": 0.3933, "step": 24810 }, { "epoch": 49.68, "grad_norm": 66.0242691040039, "learning_rate": 7.123667190317396e-07, "loss": 0.3534, "step": 24840 }, { "epoch": 49.74, "grad_norm": 77.78071594238281, "learning_rate": 7.043070936286395e-07, "loss": 0.3834, "step": 24870 }, { "epoch": 49.8, "grad_norm": 49.89218521118164, "learning_rate": 6.962898649802824e-07, "loss": 0.4152, "step": 24900 }, { "epoch": 49.86, "grad_norm": 47.149166107177734, "learning_rate": 6.883151122134812e-07, "loss": 0.4798, "step": 24930 }, { "epoch": 49.92, "grad_norm": 42.12199020385742, "learning_rate": 6.803829140358237e-07, "loss": 0.5189, "step": 24960 }, { "epoch": 49.98, "grad_norm": 53.24802780151367, "learning_rate": 6.724933487349061e-07, "loss": 0.3758, "step": 24990 }, { "epoch": 50.0, "eval_loss": 0.29586249589920044, "eval_map": 0.7921, "eval_map_50": 0.9609, "eval_map_75": 0.9203, "eval_map_chicken": 0.7932, "eval_map_duck": 0.7619, "eval_map_large": 0.8779, "eval_map_medium": 0.7853, "eval_map_plant": 0.8212, "eval_map_small": 0.2432, "eval_mar_1": 0.3066, "eval_mar_10": 0.8273, "eval_mar_100": 0.8314, "eval_mar_100_chicken": 0.832, "eval_mar_100_duck": 0.7918, "eval_mar_100_plant": 0.8703, "eval_mar_large": 0.9197, "eval_mar_medium": 0.8365, "eval_mar_small": 0.3655, "eval_runtime": 5.0566, "eval_samples_per_second": 19.776, "eval_steps_per_second": 2.571, "step": 25000 }, { "epoch": 50.04, "grad_norm": 88.88943481445312, "learning_rate": 6.646464941775499e-07, "loss": 0.4487, "step": 25020 }, { "epoch": 50.1, "grad_norm": 51.90554428100586, "learning_rate": 6.568424278090446e-07, "loss": 0.3981, "step": 25050 }, { "epoch": 50.16, "grad_norm": 53.483455657958984, "learning_rate": 6.490812266523716e-07, "loss": 0.3775, "step": 25080 }, { "epoch": 50.22, "grad_norm": 49.997982025146484, "learning_rate": 6.413629673074562e-07, "loss": 0.4164, "step": 25110 }, { "epoch": 50.28, "grad_norm": 55.87346267700195, "learning_rate": 6.336877259504004e-07, "loss": 0.3653, "step": 25140 }, { "epoch": 50.34, "grad_norm": 85.9616470336914, "learning_rate": 6.260555783327366e-07, "loss": 0.4081, "step": 25170 }, { "epoch": 50.4, "grad_norm": 95.91594696044922, "learning_rate": 6.184665997806832e-07, "loss": 0.4766, "step": 25200 }, { "epoch": 50.46, "grad_norm": 52.188880920410156, "learning_rate": 6.109208651943921e-07, "loss": 0.4127, "step": 25230 }, { "epoch": 50.52, "grad_norm": 146.0522003173828, "learning_rate": 6.034184490472195e-07, "loss": 0.339, "step": 25260 }, { "epoch": 50.58, "grad_norm": 63.30977249145508, "learning_rate": 5.959594253849821e-07, "loss": 0.4051, "step": 25290 }, { "epoch": 50.64, "grad_norm": 45.95663070678711, "learning_rate": 5.885438678252342e-07, "loss": 0.4141, "step": 25320 }, { "epoch": 50.7, "grad_norm": 194.88026428222656, "learning_rate": 5.811718495565327e-07, "loss": 0.3736, "step": 25350 }, { "epoch": 50.76, "grad_norm": 47.18809509277344, "learning_rate": 5.738434433377244e-07, "loss": 0.4111, "step": 25380 }, { "epoch": 50.82, "grad_norm": 21.77028465270996, "learning_rate": 5.665587214972173e-07, "loss": 0.4393, "step": 25410 }, { "epoch": 50.88, "grad_norm": 107.16293334960938, "learning_rate": 5.593177559322776e-07, "loss": 0.3947, "step": 25440 }, { "epoch": 50.94, "grad_norm": 60.57902526855469, "learning_rate": 5.521206181083111e-07, "loss": 0.5372, "step": 25470 }, { "epoch": 51.0, "grad_norm": 33.81594467163086, "learning_rate": 5.449673790581611e-07, "loss": 0.4397, "step": 25500 }, { "epoch": 51.0, "eval_loss": 0.2871440052986145, "eval_map": 0.7983, "eval_map_50": 0.9609, "eval_map_75": 0.9128, "eval_map_chicken": 0.802, "eval_map_duck": 0.7648, "eval_map_large": 0.8832, "eval_map_medium": 0.7966, "eval_map_plant": 0.828, "eval_map_small": 0.2145, "eval_mar_1": 0.3086, "eval_mar_10": 0.833, "eval_mar_100": 0.8374, "eval_mar_100_chicken": 0.8369, "eval_mar_100_duck": 0.7969, "eval_mar_100_plant": 0.8784, "eval_mar_large": 0.9251, "eval_mar_medium": 0.8478, "eval_mar_small": 0.3409, "eval_runtime": 5.1551, "eval_samples_per_second": 19.398, "eval_steps_per_second": 2.522, "step": 25500 }, { "epoch": 51.06, "grad_norm": 61.52519607543945, "learning_rate": 5.378581093814112e-07, "loss": 0.3936, "step": 25530 }, { "epoch": 51.12, "grad_norm": 41.62113952636719, "learning_rate": 5.307928792436812e-07, "loss": 0.3472, "step": 25560 }, { "epoch": 51.18, "grad_norm": 58.78872299194336, "learning_rate": 5.237717583759421e-07, "loss": 0.4171, "step": 25590 }, { "epoch": 51.24, "grad_norm": 71.37984466552734, "learning_rate": 5.167948160738206e-07, "loss": 0.3807, "step": 25620 }, { "epoch": 51.3, "grad_norm": 30.988309860229492, "learning_rate": 5.098621211969224e-07, "loss": 0.4499, "step": 25650 }, { "epoch": 51.36, "grad_norm": 90.97999572753906, "learning_rate": 5.029737421681446e-07, "loss": 0.406, "step": 25680 }, { "epoch": 51.42, "grad_norm": 39.365169525146484, "learning_rate": 4.961297469730097e-07, "loss": 0.4401, "step": 25710 }, { "epoch": 51.48, "grad_norm": 56.183563232421875, "learning_rate": 4.893302031589864e-07, "loss": 0.4249, "step": 25740 }, { "epoch": 51.54, "grad_norm": 35.67009353637695, "learning_rate": 4.825751778348259e-07, "loss": 0.4689, "step": 25770 }, { "epoch": 51.6, "grad_norm": 68.61273956298828, "learning_rate": 4.758647376699033e-07, "loss": 0.3953, "step": 25800 }, { "epoch": 51.66, "grad_norm": 39.2368049621582, "learning_rate": 4.691989488935511e-07, "loss": 0.4341, "step": 25830 }, { "epoch": 51.72, "grad_norm": 40.57124710083008, "learning_rate": 4.625778772944156e-07, "loss": 0.3937, "step": 25860 }, { "epoch": 51.78, "grad_norm": 63.675323486328125, "learning_rate": 4.5600158821979933e-07, "loss": 0.3677, "step": 25890 }, { "epoch": 51.84, "grad_norm": 52.42002487182617, "learning_rate": 4.494701465750217e-07, "loss": 0.336, "step": 25920 }, { "epoch": 51.9, "grad_norm": 30.058719635009766, "learning_rate": 4.4298361682277355e-07, "loss": 0.4698, "step": 25950 }, { "epoch": 51.96, "grad_norm": 51.076725006103516, "learning_rate": 4.3654206298248625e-07, "loss": 0.3917, "step": 25980 }, { "epoch": 52.0, "eval_loss": 0.29068684577941895, "eval_map": 0.7955, "eval_map_50": 0.9645, "eval_map_75": 0.9161, "eval_map_chicken": 0.7975, "eval_map_duck": 0.7654, "eval_map_large": 0.8796, "eval_map_medium": 0.7911, "eval_map_plant": 0.8234, "eval_map_small": 0.2316, "eval_mar_1": 0.308, "eval_mar_10": 0.8314, "eval_mar_100": 0.8352, "eval_mar_100_chicken": 0.8356, "eval_mar_100_duck": 0.7969, "eval_mar_100_plant": 0.8732, "eval_mar_large": 0.9192, "eval_mar_medium": 0.8428, "eval_mar_small": 0.375, "eval_runtime": 5.0448, "eval_samples_per_second": 19.822, "eval_steps_per_second": 2.577, "step": 26000 }, { "epoch": 52.02, "grad_norm": 34.134273529052734, "learning_rate": 4.301455486296946e-07, "loss": 0.422, "step": 26010 }, { "epoch": 52.08, "grad_norm": 62.580841064453125, "learning_rate": 4.237941368954124e-07, "loss": 0.374, "step": 26040 }, { "epoch": 52.14, "grad_norm": 49.3266487121582, "learning_rate": 4.1748789046551055e-07, "loss": 0.384, "step": 26070 }, { "epoch": 52.2, "grad_norm": 0.00041551125468686223, "learning_rate": 4.112268715800943e-07, "loss": 0.4655, "step": 26100 }, { "epoch": 52.26, "grad_norm": 38.26332473754883, "learning_rate": 4.0501114203289395e-07, "loss": 0.3986, "step": 26130 }, { "epoch": 52.32, "grad_norm": 65.15966796875, "learning_rate": 3.9884076317064813e-07, "loss": 0.4129, "step": 26160 }, { "epoch": 52.38, "grad_norm": 74.6011962890625, "learning_rate": 3.9271579589250817e-07, "loss": 0.477, "step": 26190 }, { "epoch": 52.44, "grad_norm": 48.72752380371094, "learning_rate": 3.866363006494256e-07, "loss": 0.4237, "step": 26220 }, { "epoch": 52.5, "grad_norm": 39.035118103027344, "learning_rate": 3.8060233744356634e-07, "loss": 0.4287, "step": 26250 }, { "epoch": 52.56, "grad_norm": 54.2945556640625, "learning_rate": 3.7461396582771035e-07, "loss": 0.4003, "step": 26280 }, { "epoch": 52.62, "grad_norm": 59.89337921142578, "learning_rate": 3.6867124490466697e-07, "loss": 0.4809, "step": 26310 }, { "epoch": 52.68, "grad_norm": 32.89358139038086, "learning_rate": 3.627742333266937e-07, "loss": 0.3781, "step": 26340 }, { "epoch": 52.74, "grad_norm": 114.98311614990234, "learning_rate": 3.569229892949133e-07, "loss": 0.4946, "step": 26370 }, { "epoch": 52.8, "grad_norm": 62.90887451171875, "learning_rate": 3.511175705587433e-07, "loss": 0.4092, "step": 26400 }, { "epoch": 52.86, "grad_norm": 408.21044921875, "learning_rate": 3.4535803441532125e-07, "loss": 0.4111, "step": 26430 }, { "epoch": 52.92, "grad_norm": 35.12818145751953, "learning_rate": 3.396444377089453e-07, "loss": 0.4019, "step": 26460 }, { "epoch": 52.98, "grad_norm": 0.0001875197485787794, "learning_rate": 3.3397683683050685e-07, "loss": 0.3362, "step": 26490 }, { "epoch": 53.0, "eval_loss": 0.2884664237499237, "eval_map": 0.7989, "eval_map_50": 0.9644, "eval_map_75": 0.92, "eval_map_chicken": 0.8012, "eval_map_duck": 0.7703, "eval_map_large": 0.8789, "eval_map_medium": 0.7958, "eval_map_plant": 0.8253, "eval_map_small": 0.2324, "eval_mar_1": 0.3075, "eval_mar_10": 0.8338, "eval_mar_100": 0.8379, "eval_mar_100_chicken": 0.8382, "eval_mar_100_duck": 0.8, "eval_mar_100_plant": 0.8755, "eval_mar_large": 0.9201, "eval_mar_medium": 0.8465, "eval_mar_small": 0.3769, "eval_runtime": 5.0147, "eval_samples_per_second": 19.941, "eval_steps_per_second": 2.592, "step": 26500 }, { "epoch": 53.04, "grad_norm": 47.404518127441406, "learning_rate": 3.283552877169399e-07, "loss": 0.4292, "step": 26520 }, { "epoch": 53.1, "grad_norm": 52.7077751159668, "learning_rate": 3.227798458506637e-07, "loss": 0.3831, "step": 26550 }, { "epoch": 53.16, "grad_norm": 0.0004456727474462241, "learning_rate": 3.172505662590386e-07, "loss": 0.3576, "step": 26580 }, { "epoch": 53.22, "grad_norm": 55.14971923828125, "learning_rate": 3.1176750351382235e-07, "loss": 0.3817, "step": 26610 }, { "epoch": 53.28, "grad_norm": 221.3983917236328, "learning_rate": 3.0633071173062966e-07, "loss": 0.4345, "step": 26640 }, { "epoch": 53.34, "grad_norm": 42.98983383178711, "learning_rate": 3.0094024456840176e-07, "loss": 0.4081, "step": 26670 }, { "epoch": 53.4, "grad_norm": 53.3066291809082, "learning_rate": 2.9559615522887275e-07, "loss": 0.402, "step": 26700 }, { "epoch": 53.46, "grad_norm": 70.44734191894531, "learning_rate": 2.9029849645604735e-07, "loss": 0.4517, "step": 26730 }, { "epoch": 53.52, "grad_norm": 49.392723083496094, "learning_rate": 2.850473205356774e-07, "loss": 0.3977, "step": 26760 }, { "epoch": 53.58, "grad_norm": 77.64625549316406, "learning_rate": 2.798426792947517e-07, "loss": 0.4356, "step": 26790 }, { "epoch": 53.64, "grad_norm": 59.67546081542969, "learning_rate": 2.746846241009765e-07, "loss": 0.5099, "step": 26820 }, { "epoch": 53.7, "grad_norm": 136.89759826660156, "learning_rate": 2.6957320586227354e-07, "loss": 0.3658, "step": 26850 }, { "epoch": 53.76, "grad_norm": 64.72844696044922, "learning_rate": 2.6450847502627883e-07, "loss": 0.5296, "step": 26880 }, { "epoch": 53.82, "grad_norm": 134.72019958496094, "learning_rate": 2.594904815798399e-07, "loss": 0.4809, "step": 26910 }, { "epoch": 53.88, "grad_norm": 373.54449462890625, "learning_rate": 2.5451927504852757e-07, "loss": 0.4206, "step": 26940 }, { "epoch": 53.94, "grad_norm": 53.72751998901367, "learning_rate": 2.49594904496141e-07, "loss": 0.368, "step": 26970 }, { "epoch": 54.0, "grad_norm": 68.3394546508789, "learning_rate": 2.447174185242324e-07, "loss": 0.4004, "step": 27000 }, { "epoch": 54.0, "eval_loss": 0.28688502311706543, "eval_map": 0.7973, "eval_map_50": 0.9644, "eval_map_75": 0.9201, "eval_map_chicken": 0.801, "eval_map_duck": 0.7636, "eval_map_large": 0.8813, "eval_map_medium": 0.7957, "eval_map_plant": 0.8273, "eval_map_small": 0.228, "eval_mar_1": 0.3069, "eval_mar_10": 0.8328, "eval_mar_100": 0.8368, "eval_mar_100_chicken": 0.8373, "eval_mar_100_duck": 0.7948, "eval_mar_100_plant": 0.8781, "eval_mar_large": 0.9218, "eval_mar_medium": 0.8456, "eval_mar_small": 0.3822, "eval_runtime": 5.2392, "eval_samples_per_second": 19.087, "eval_steps_per_second": 2.481, "step": 27000 }, { "epoch": 54.06, "grad_norm": 70.93304443359375, "learning_rate": 2.3988686527161686e-07, "loss": 0.3863, "step": 27030 }, { "epoch": 54.12, "grad_norm": 427.5562438964844, "learning_rate": 2.351032924139063e-07, "loss": 0.4965, "step": 27060 }, { "epoch": 54.18, "grad_norm": 0.00017418510105926543, "learning_rate": 2.3036674716303277e-07, "loss": 0.4601, "step": 27090 }, { "epoch": 54.24, "grad_norm": 59.90283203125, "learning_rate": 2.2567727626678527e-07, "loss": 0.3882, "step": 27120 }, { "epoch": 54.3, "grad_norm": 60.470008850097656, "learning_rate": 2.210349260083494e-07, "loss": 0.4183, "step": 27150 }, { "epoch": 54.36, "grad_norm": 54.06813430786133, "learning_rate": 2.1643974220584729e-07, "loss": 0.4768, "step": 27180 }, { "epoch": 54.42, "grad_norm": 37.11991882324219, "learning_rate": 2.1189177021188888e-07, "loss": 0.402, "step": 27210 }, { "epoch": 54.48, "grad_norm": 89.20401763916016, "learning_rate": 2.0739105491312028e-07, "loss": 0.4153, "step": 27240 }, { "epoch": 54.54, "grad_norm": 56.34545135498047, "learning_rate": 2.0293764072978618e-07, "loss": 0.408, "step": 27270 }, { "epoch": 54.6, "grad_norm": 97.46742248535156, "learning_rate": 1.9853157161528468e-07, "loss": 0.4485, "step": 27300 }, { "epoch": 54.66, "grad_norm": 48.18669509887695, "learning_rate": 1.9417289105574054e-07, "loss": 0.4489, "step": 27330 }, { "epoch": 54.72, "grad_norm": 62.39783477783203, "learning_rate": 1.8986164206957037e-07, "loss": 0.3776, "step": 27360 }, { "epoch": 54.78, "grad_norm": 0.000213187318877317, "learning_rate": 1.8559786720706185e-07, "loss": 0.3596, "step": 27390 }, { "epoch": 54.84, "grad_norm": 97.40396118164062, "learning_rate": 1.8138160854995145e-07, "loss": 0.4219, "step": 27420 }, { "epoch": 54.9, "grad_norm": 42.91602325439453, "learning_rate": 1.7721290771100964e-07, "loss": 0.4467, "step": 27450 }, { "epoch": 54.96, "grad_norm": 46.58220291137695, "learning_rate": 1.7309180583363062e-07, "loss": 0.406, "step": 27480 }, { "epoch": 55.0, "eval_loss": 0.28708022832870483, "eval_map": 0.8004, "eval_map_50": 0.9645, "eval_map_75": 0.9194, "eval_map_chicken": 0.8069, "eval_map_duck": 0.7679, "eval_map_large": 0.8788, "eval_map_medium": 0.7986, "eval_map_plant": 0.8265, "eval_map_small": 0.2283, "eval_mar_1": 0.3084, "eval_mar_10": 0.8343, "eval_mar_100": 0.8384, "eval_mar_100_chicken": 0.8404, "eval_mar_100_duck": 0.7979, "eval_mar_100_plant": 0.8769, "eval_mar_large": 0.9205, "eval_mar_medium": 0.8476, "eval_mar_small": 0.3822, "eval_runtime": 5.0648, "eval_samples_per_second": 19.744, "eval_steps_per_second": 2.567, "step": 27500 }, { "epoch": 55.02, "grad_norm": 44.80258560180664, "learning_rate": 1.690183435914261e-07, "loss": 0.4592, "step": 27510 }, { "epoch": 55.08, "grad_norm": 46.293399810791016, "learning_rate": 1.6499256118782503e-07, "loss": 0.4603, "step": 27540 }, { "epoch": 55.14, "grad_norm": 0.00020682995091192424, "learning_rate": 1.6101449835567273e-07, "loss": 0.3691, "step": 27570 }, { "epoch": 55.2, "grad_norm": 0.00038863185909576714, "learning_rate": 1.5708419435684463e-07, "loss": 0.3658, "step": 27600 }, { "epoch": 55.26, "grad_norm": 64.51366424560547, "learning_rate": 1.532016879818532e-07, "loss": 0.4051, "step": 27630 }, { "epoch": 55.32, "grad_norm": 137.62094116210938, "learning_rate": 1.4936701754947104e-07, "loss": 0.3851, "step": 27660 }, { "epoch": 55.38, "grad_norm": 32.709232330322266, "learning_rate": 1.4558022090634504e-07, "loss": 0.4879, "step": 27690 }, { "epoch": 55.44, "grad_norm": 40.718658447265625, "learning_rate": 1.4184133542663014e-07, "loss": 0.4211, "step": 27720 }, { "epoch": 55.5, "grad_norm": 65.1848373413086, "learning_rate": 1.3815039801161723e-07, "loss": 0.4523, "step": 27750 }, { "epoch": 55.56, "grad_norm": 37.71095657348633, "learning_rate": 1.3450744508936687e-07, "loss": 0.3766, "step": 27780 }, { "epoch": 55.62, "grad_norm": 58.59610366821289, "learning_rate": 1.3091251261435568e-07, "loss": 0.4531, "step": 27810 }, { "epoch": 55.68, "grad_norm": 38.84789276123047, "learning_rate": 1.2736563606711384e-07, "loss": 0.3873, "step": 27840 }, { "epoch": 55.74, "grad_norm": 0.0002489400503691286, "learning_rate": 1.2386685045388313e-07, "loss": 0.3393, "step": 27870 }, { "epoch": 55.8, "grad_norm": 122.7408218383789, "learning_rate": 1.2041619030626283e-07, "loss": 0.4669, "step": 27900 }, { "epoch": 55.86, "grad_norm": 0.0002524556184653193, "learning_rate": 1.1701368968087711e-07, "loss": 0.5525, "step": 27930 }, { "epoch": 55.92, "grad_norm": 32.06369400024414, "learning_rate": 1.136593821590326e-07, "loss": 0.3817, "step": 27960 }, { "epoch": 55.98, "grad_norm": 164.66461181640625, "learning_rate": 1.1035330084639084e-07, "loss": 0.3876, "step": 27990 }, { "epoch": 56.0, "eval_loss": 0.2882368564605713, "eval_map": 0.7985, "eval_map_50": 0.9641, "eval_map_75": 0.9197, "eval_map_chicken": 0.8072, "eval_map_duck": 0.7646, "eval_map_large": 0.8772, "eval_map_medium": 0.7974, "eval_map_plant": 0.8237, "eval_map_small": 0.2257, "eval_mar_1": 0.3084, "eval_mar_10": 0.834, "eval_mar_100": 0.838, "eval_mar_100_chicken": 0.8436, "eval_mar_100_duck": 0.7969, "eval_mar_100_plant": 0.8735, "eval_mar_large": 0.918, "eval_mar_medium": 0.8474, "eval_mar_small": 0.3676, "eval_runtime": 5.0534, "eval_samples_per_second": 19.788, "eval_steps_per_second": 2.573, "step": 28000 }, { "epoch": 56.04, "grad_norm": 101.48612213134766, "learning_rate": 1.0709547837263967e-07, "loss": 0.4297, "step": 28020 }, { "epoch": 56.1, "grad_norm": 32.960208892822266, "learning_rate": 1.038859468911707e-07, "loss": 0.3881, "step": 28050 }, { "epoch": 56.16, "grad_norm": 45.9619026184082, "learning_rate": 1.007247380787657e-07, "loss": 0.3947, "step": 28080 }, { "epoch": 56.22, "grad_norm": 50.23225784301758, "learning_rate": 9.761188313527792e-08, "loss": 0.4163, "step": 28110 }, { "epoch": 56.28, "grad_norm": 69.35472106933594, "learning_rate": 9.454741278333013e-08, "loss": 0.4509, "step": 28140 }, { "epoch": 56.34, "grad_norm": 49.21049118041992, "learning_rate": 9.153135726800599e-08, "loss": 0.4435, "step": 28170 }, { "epoch": 56.4, "grad_norm": 24.567251205444336, "learning_rate": 8.856374635655696e-08, "loss": 0.435, "step": 28200 }, { "epoch": 56.46, "grad_norm": 41.68861770629883, "learning_rate": 8.564460933810414e-08, "loss": 0.4124, "step": 28230 }, { "epoch": 56.52, "grad_norm": 62.273746490478516, "learning_rate": 8.277397502335194e-08, "loss": 0.4942, "step": 28260 }, { "epoch": 56.58, "grad_norm": 38.9687385559082, "learning_rate": 7.995187174430152e-08, "loss": 0.3975, "step": 28290 }, { "epoch": 56.64, "grad_norm": 60.86214828491211, "learning_rate": 7.717832735397335e-08, "loss": 0.3889, "step": 28320 }, { "epoch": 56.7, "grad_norm": 106.79747009277344, "learning_rate": 7.445336922613067e-08, "loss": 0.3872, "step": 28350 }, { "epoch": 56.76, "grad_norm": 185.20068359375, "learning_rate": 7.177702425500977e-08, "loss": 0.3844, "step": 28380 }, { "epoch": 56.82, "grad_norm": 44.18353271484375, "learning_rate": 6.914931885505626e-08, "loss": 0.4314, "step": 28410 }, { "epoch": 56.88, "grad_norm": 41.35288619995117, "learning_rate": 6.657027896065982e-08, "loss": 0.4599, "step": 28440 }, { "epoch": 56.94, "grad_norm": 294.2066345214844, "learning_rate": 6.403993002590425e-08, "loss": 0.3814, "step": 28470 }, { "epoch": 57.0, "grad_norm": 38.01483154296875, "learning_rate": 6.15582970243117e-08, "loss": 0.3939, "step": 28500 }, { "epoch": 57.0, "eval_loss": 0.28454330563545227, "eval_map": 0.8024, "eval_map_50": 0.9645, "eval_map_75": 0.9195, "eval_map_chicken": 0.8102, "eval_map_duck": 0.7709, "eval_map_large": 0.8782, "eval_map_medium": 0.8014, "eval_map_plant": 0.8262, "eval_map_small": 0.2291, "eval_mar_1": 0.3093, "eval_mar_10": 0.8367, "eval_mar_100": 0.8405, "eval_mar_100_chicken": 0.8431, "eval_mar_100_duck": 0.8021, "eval_mar_100_plant": 0.8764, "eval_mar_large": 0.9197, "eval_mar_medium": 0.8511, "eval_mar_small": 0.3697, "eval_runtime": 5.2741, "eval_samples_per_second": 18.961, "eval_steps_per_second": 2.465, "step": 28500 }, { "epoch": 57.06, "grad_norm": 40.22798156738281, "learning_rate": 5.9125404448597825e-08, "loss": 0.4592, "step": 28530 }, { "epoch": 57.12, "grad_norm": 227.82638549804688, "learning_rate": 5.674127631043025e-08, "loss": 0.3248, "step": 28560 }, { "epoch": 57.18, "grad_norm": 31.734601974487305, "learning_rate": 5.440593614019107e-08, "loss": 0.3187, "step": 28590 }, { "epoch": 57.24, "grad_norm": 49.92489242553711, "learning_rate": 5.2119406986745336e-08, "loss": 0.3835, "step": 28620 }, { "epoch": 57.3, "grad_norm": 92.18814849853516, "learning_rate": 4.988171141721232e-08, "loss": 0.4056, "step": 28650 }, { "epoch": 57.36, "grad_norm": 53.62547302246094, "learning_rate": 4.769287151674407e-08, "loss": 0.4088, "step": 28680 }, { "epoch": 57.42, "grad_norm": 53.25278091430664, "learning_rate": 4.5552908888306654e-08, "loss": 0.4545, "step": 28710 }, { "epoch": 57.48, "grad_norm": 47.75865173339844, "learning_rate": 4.346184465246761e-08, "loss": 0.4104, "step": 28740 }, { "epoch": 57.54, "grad_norm": 69.6591796875, "learning_rate": 4.1419699447186045e-08, "loss": 0.4026, "step": 28770 }, { "epoch": 57.6, "grad_norm": 50.19314956665039, "learning_rate": 3.9426493427611177e-08, "loss": 0.3975, "step": 28800 }, { "epoch": 57.66, "grad_norm": 54.0328369140625, "learning_rate": 3.748224626588137e-08, "loss": 0.6515, "step": 28830 }, { "epoch": 57.72, "grad_norm": 39.40961837768555, "learning_rate": 3.558697715093207e-08, "loss": 0.406, "step": 28860 }, { "epoch": 57.78, "grad_norm": 43.196834564208984, "learning_rate": 3.374070478830316e-08, "loss": 0.4559, "step": 28890 }, { "epoch": 57.84, "grad_norm": 23.547550201416016, "learning_rate": 3.194344739995803e-08, "loss": 0.605, "step": 28920 }, { "epoch": 57.9, "grad_norm": 69.10009765625, "learning_rate": 3.019522272410202e-08, "loss": 0.4126, "step": 28950 }, { "epoch": 57.96, "grad_norm": 66.09160614013672, "learning_rate": 2.8496048015005385e-08, "loss": 0.4218, "step": 28980 }, { "epoch": 58.0, "eval_loss": 0.2852034270763397, "eval_map": 0.8, "eval_map_50": 0.9646, "eval_map_75": 0.9196, "eval_map_chicken": 0.8067, "eval_map_duck": 0.7689, "eval_map_large": 0.8774, "eval_map_medium": 0.7993, "eval_map_plant": 0.8245, "eval_map_small": 0.2254, "eval_mar_1": 0.3085, "eval_mar_10": 0.8346, "eval_mar_100": 0.8384, "eval_mar_100_chicken": 0.8413, "eval_mar_100_duck": 0.799, "eval_mar_100_plant": 0.8749, "eval_mar_large": 0.9188, "eval_mar_medium": 0.8488, "eval_mar_small": 0.3634, "eval_runtime": 5.0721, "eval_samples_per_second": 19.716, "eval_steps_per_second": 2.563, "step": 29000 }, { "epoch": 58.02, "grad_norm": 69.85868072509766, "learning_rate": 2.684594004283836e-08, "loss": 0.4304, "step": 29010 }, { "epoch": 58.08, "grad_norm": 41.767555236816406, "learning_rate": 2.5244915093499134e-08, "loss": 0.3461, "step": 29040 }, { "epoch": 58.14, "grad_norm": 82.25499725341797, "learning_rate": 2.3692988968458398e-08, "loss": 0.5096, "step": 29070 }, { "epoch": 58.2, "grad_norm": 54.37453079223633, "learning_rate": 2.219017698460002e-08, "loss": 0.4233, "step": 29100 }, { "epoch": 58.26, "grad_norm": 61.195838928222656, "learning_rate": 2.0736493974071736e-08, "loss": 0.3487, "step": 29130 }, { "epoch": 58.32, "grad_norm": 28.579872131347656, "learning_rate": 1.9331954284137476e-08, "loss": 0.3522, "step": 29160 }, { "epoch": 58.38, "grad_norm": 56.89299774169922, "learning_rate": 1.7976571777038044e-08, "loss": 0.3813, "step": 29190 }, { "epoch": 58.44, "grad_norm": 56.8980598449707, "learning_rate": 1.6670359829850657e-08, "loss": 0.4162, "step": 29220 }, { "epoch": 58.5, "grad_norm": 39.616416931152344, "learning_rate": 1.541333133436018e-08, "loss": 0.4343, "step": 29250 }, { "epoch": 58.56, "grad_norm": 47.3499641418457, "learning_rate": 1.4205498696930332e-08, "loss": 0.3844, "step": 29280 }, { "epoch": 58.62, "grad_norm": 49.85858917236328, "learning_rate": 1.3046873838381546e-08, "loss": 0.4488, "step": 29310 }, { "epoch": 58.68, "grad_norm": 63.439273834228516, "learning_rate": 1.1937468193873869e-08, "loss": 0.4068, "step": 29340 }, { "epoch": 58.74, "grad_norm": 22.61992835998535, "learning_rate": 1.0877292712792586e-08, "loss": 0.3993, "step": 29370 }, { "epoch": 58.8, "grad_norm": 182.1600799560547, "learning_rate": 9.866357858642206e-09, "loss": 0.3899, "step": 29400 }, { "epoch": 58.86, "grad_norm": 54.466739654541016, "learning_rate": 8.904673608940983e-09, "loss": 0.394, "step": 29430 }, { "epoch": 58.92, "grad_norm": 56.43994903564453, "learning_rate": 7.992249455124889e-09, "loss": 0.3792, "step": 29460 }, { "epoch": 58.98, "grad_norm": 29.733278274536133, "learning_rate": 7.129094402451575e-09, "loss": 0.4046, "step": 29490 }, { "epoch": 59.0, "eval_loss": 0.2850831151008606, "eval_map": 0.8008, "eval_map_50": 0.9645, "eval_map_75": 0.9196, "eval_map_chicken": 0.8079, "eval_map_duck": 0.7689, "eval_map_large": 0.878, "eval_map_medium": 0.8002, "eval_map_plant": 0.8256, "eval_map_small": 0.2283, "eval_mar_1": 0.3087, "eval_mar_10": 0.835, "eval_mar_100": 0.8388, "eval_mar_100_chicken": 0.8418, "eval_mar_100_duck": 0.799, "eval_mar_100_plant": 0.8758, "eval_mar_large": 0.9188, "eval_mar_medium": 0.8497, "eval_mar_small": 0.3655, "eval_runtime": 5.5802, "eval_samples_per_second": 17.921, "eval_steps_per_second": 2.33, "step": 29500 }, { "epoch": 59.04, "grad_norm": 29.91386604309082, "learning_rate": 6.315216969912663e-09, "loss": 0.3851, "step": 29520 }, { "epoch": 59.1, "grad_norm": 505.2102355957031, "learning_rate": 5.5506251901504825e-09, "loss": 0.3666, "step": 29550 }, { "epoch": 59.16, "grad_norm": 45.7656135559082, "learning_rate": 4.835326609376468e-09, "loss": 0.4178, "step": 29580 }, { "epoch": 59.22, "grad_norm": 56.061153411865234, "learning_rate": 4.169328287299545e-09, "loss": 0.4697, "step": 29610 }, { "epoch": 59.28, "grad_norm": 93.67945098876953, "learning_rate": 3.5526367970539765e-09, "loss": 0.3581, "step": 29640 }, { "epoch": 59.34, "grad_norm": 56.09961700439453, "learning_rate": 2.9852582251355124e-09, "loss": 0.4007, "step": 29670 }, { "epoch": 59.4, "grad_norm": 95.72340393066406, "learning_rate": 2.4671981713420003e-09, "loss": 0.4338, "step": 29700 }, { "epoch": 59.46, "grad_norm": 73.806884765625, "learning_rate": 1.9984617487173174e-09, "loss": 0.4488, "step": 29730 }, { "epoch": 59.52, "grad_norm": 63.850746154785156, "learning_rate": 1.5790535835003006e-09, "loss": 0.4424, "step": 29760 }, { "epoch": 59.58, "grad_norm": 54.269371032714844, "learning_rate": 1.2089778150797816e-09, "loss": 0.4145, "step": 29790 }, { "epoch": 59.64, "grad_norm": 45.143714904785156, "learning_rate": 8.88238095955174e-10, "loss": 0.4422, "step": 29820 }, { "epoch": 59.7, "grad_norm": 32.879642486572266, "learning_rate": 6.168375916970615e-10, "loss": 0.3915, "step": 29850 }, { "epoch": 59.76, "grad_norm": 68.58180236816406, "learning_rate": 3.9477898091944135e-10, "loss": 0.423, "step": 29880 }, { "epoch": 59.82, "grad_norm": 57.879634857177734, "learning_rate": 2.2206445525085886e-10, "loss": 0.4619, "step": 29910 }, { "epoch": 59.88, "grad_norm": 133.5286102294922, "learning_rate": 9.869571931442334e-11, "loss": 0.3987, "step": 29940 }, { "epoch": 59.94, "grad_norm": 63.78921127319336, "learning_rate": 2.467399070893439e-11, "loss": 0.3533, "step": 29970 }, { "epoch": 60.0, "grad_norm": 65.49594116210938, "learning_rate": 0.0, "loss": 0.4504, "step": 30000 }, { "epoch": 60.0, "eval_loss": 0.28507041931152344, "eval_map": 0.8003, "eval_map_50": 0.9645, "eval_map_75": 0.9196, "eval_map_chicken": 0.8072, "eval_map_duck": 0.7689, "eval_map_large": 0.8772, "eval_map_medium": 0.7999, "eval_map_plant": 0.8248, "eval_map_small": 0.2246, "eval_mar_1": 0.3086, "eval_mar_10": 0.8346, "eval_mar_100": 0.8384, "eval_mar_100_chicken": 0.8413, "eval_mar_100_duck": 0.799, "eval_mar_100_plant": 0.8749, "eval_mar_large": 0.918, "eval_mar_medium": 0.8496, "eval_mar_small": 0.3614, "eval_runtime": 5.2733, "eval_samples_per_second": 18.963, "eval_steps_per_second": 2.465, "step": 30000 } ], "logging_steps": 30, "max_steps": 30000, "num_input_tokens_seen": 0, "num_train_epochs": 60, "save_steps": 10, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1.0320693387264e+19, "train_batch_size": 2, "trial_name": null, "trial_params": null }