diff --git "a/last-checkpoint/trainer_state.json" "b/last-checkpoint/trainer_state.json" --- "a/last-checkpoint/trainer_state.json" +++ "b/last-checkpoint/trainer_state.json" @@ -1,9 +1,9 @@ { - "best_metric": 0.28515276312828064, - "best_model_checkpoint": "chickens-composite-201616161616-150-epochs-w-transform/checkpoint-69500", - "epoch": 149.0, + "best_metric": 0.3433947265148163, + "best_model_checkpoint": "chickens-composite-201616161616-150-epochs-w-transform/checkpoint-33000", + "epoch": 70.0, "eval_steps": 500, - "global_step": 74500, + "global_step": 35000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, @@ -9989,11279 +9989,6 @@ "eval_samples_per_second": 6.927, "eval_steps_per_second": 0.901, "step": 35000 - }, - { - "epoch": 70.02, - "grad_norm": 57.60066223144531, - "learning_rate": 5.520559348760984e-06, - "loss": 0.2609, - "step": 35010 - }, - { - "epoch": 70.08, - "grad_norm": 57.3175048828125, - "learning_rate": 5.514309899468209e-06, - "loss": 0.4133, - "step": 35040 - }, - { - "epoch": 70.14, - "grad_norm": 42.147911071777344, - "learning_rate": 5.5080596380099e-06, - "loss": 0.4609, - "step": 35070 - }, - { - "epoch": 70.2, - "grad_norm": 35.86623764038086, - "learning_rate": 5.5018085742560745e-06, - "loss": 0.4458, - "step": 35100 - }, - { - "epoch": 70.26, - "grad_norm": 31.622404098510742, - "learning_rate": 5.495556718078017e-06, - "loss": 0.3592, - "step": 35130 - }, - { - "epoch": 70.32, - "grad_norm": 239.2526092529297, - "learning_rate": 5.489304079348259e-06, - "loss": 0.4239, - "step": 35160 - }, - { - "epoch": 70.38, - "grad_norm": 98.21315002441406, - "learning_rate": 5.483050667940571e-06, - "loss": 0.36, - "step": 35190 - }, - { - "epoch": 70.44, - "grad_norm": 60.83596420288086, - "learning_rate": 5.476796493729943e-06, - "loss": 0.358, - "step": 35220 - }, - { - "epoch": 70.5, - "grad_norm": 126.31898498535156, - "learning_rate": 5.470541566592573e-06, - "loss": 0.3843, - "step": 35250 - }, - { - "epoch": 70.56, - "grad_norm": 55.7030143737793, - "learning_rate": 5.46428589640584e-06, - "loss": 0.3776, - "step": 35280 - }, - { - "epoch": 70.62, - "grad_norm": 92.43096923828125, - "learning_rate": 5.458029493048303e-06, - "loss": 0.4364, - "step": 35310 - }, - { - "epoch": 70.68, - "grad_norm": 101.4725112915039, - "learning_rate": 5.451772366399678e-06, - "loss": 0.4747, - "step": 35340 - }, - { - "epoch": 70.74, - "grad_norm": 41.27867889404297, - "learning_rate": 5.445514526340822e-06, - "loss": 0.4274, - "step": 35370 - }, - { - "epoch": 70.8, - "grad_norm": 40.24786376953125, - "learning_rate": 5.439255982753717e-06, - "loss": 0.3721, - "step": 35400 - }, - { - "epoch": 70.86, - "grad_norm": 0.00015866973262745887, - "learning_rate": 5.432996745521458e-06, - "loss": 0.3285, - "step": 35430 - }, - { - "epoch": 70.92, - "grad_norm": 36.108192443847656, - "learning_rate": 5.426736824528236e-06, - "loss": 0.4343, - "step": 35460 - }, - { - "epoch": 70.98, - "grad_norm": 86.65865325927734, - "learning_rate": 5.420476229659319e-06, - "loss": 0.3662, - "step": 35490 - }, - { - "epoch": 71.0, - "eval_loss": 0.34761255979537964, - "eval_map": 0.748, - "eval_map_50": 0.9477, - "eval_map_75": 0.8928, - "eval_map_chicken": 0.7374, - "eval_map_duck": 0.6861, - "eval_map_large": 0.7833, - "eval_map_medium": 0.7423, - "eval_map_plant": 0.8204, - "eval_map_small": 0.2295, - "eval_mar_1": 0.3014, - "eval_mar_10": 0.791, - "eval_mar_100": 0.7964, - "eval_mar_100_chicken": 0.7873, - "eval_mar_100_duck": 0.7361, - "eval_mar_100_plant": 0.8658, - "eval_mar_large": 0.8305, - "eval_mar_medium": 0.7918, - "eval_mar_small": 0.3529, - "eval_runtime": 13.7844, - "eval_samples_per_second": 7.255, - "eval_steps_per_second": 0.943, - "step": 35500 - }, - { - "epoch": 71.04, - "grad_norm": 97.59375762939453, - "learning_rate": 5.414214970801041e-06, - "loss": 0.4473, - "step": 35520 - }, - { - "epoch": 71.1, - "grad_norm": 100.36852264404297, - "learning_rate": 5.4079530578407895e-06, - "loss": 0.4027, - "step": 35550 - }, - { - "epoch": 71.16, - "grad_norm": 106.83638000488281, - "learning_rate": 5.401690500666972e-06, - "loss": 0.3901, - "step": 35580 - }, - { - "epoch": 71.22, - "grad_norm": 48.40634536743164, - "learning_rate": 5.3954273091690245e-06, - "loss": 0.5003, - "step": 35610 - }, - { - "epoch": 71.28, - "grad_norm": 59.99224090576172, - "learning_rate": 5.389163493237382e-06, - "loss": 0.4407, - "step": 35640 - }, - { - "epoch": 71.34, - "grad_norm": 64.60873413085938, - "learning_rate": 5.3828990627634655e-06, - "loss": 0.3974, - "step": 35670 - }, - { - "epoch": 71.4, - "grad_norm": 27.694753646850586, - "learning_rate": 5.376634027639664e-06, - "loss": 0.4294, - "step": 35700 - }, - { - "epoch": 71.46, - "grad_norm": 62.43673324584961, - "learning_rate": 5.370368397759324e-06, - "loss": 0.3916, - "step": 35730 - }, - { - "epoch": 71.52, - "grad_norm": 37.97948455810547, - "learning_rate": 5.36410218301673e-06, - "loss": 0.4086, - "step": 35760 - }, - { - "epoch": 71.58, - "grad_norm": 61.94252395629883, - "learning_rate": 5.357835393307089e-06, - "loss": 0.6577, - "step": 35790 - }, - { - "epoch": 71.64, - "grad_norm": 67.63701629638672, - "learning_rate": 5.35156803852652e-06, - "loss": 0.3936, - "step": 35820 - }, - { - "epoch": 71.7, - "grad_norm": 22.23328399658203, - "learning_rate": 5.345300128572031e-06, - "loss": 0.3829, - "step": 35850 - }, - { - "epoch": 71.76, - "grad_norm": 142.47900390625, - "learning_rate": 5.339031673341505e-06, - "loss": 0.4316, - "step": 35880 - }, - { - "epoch": 71.82, - "grad_norm": 58.364990234375, - "learning_rate": 5.3327626827336906e-06, - "loss": 0.4404, - "step": 35910 - }, - { - "epoch": 71.88, - "grad_norm": 99.14762115478516, - "learning_rate": 5.326493166648179e-06, - "loss": 0.3472, - "step": 35940 - }, - { - "epoch": 71.94, - "grad_norm": 32.37788772583008, - "learning_rate": 5.320223134985393e-06, - "loss": 0.4483, - "step": 35970 - }, - { - "epoch": 72.0, - "grad_norm": 114.78788757324219, - "learning_rate": 5.3139525976465675e-06, - "loss": 0.4244, - "step": 36000 - }, - { - "epoch": 72.0, - "eval_loss": 0.3509241044521332, - "eval_map": 0.7518, - "eval_map_50": 0.9432, - "eval_map_75": 0.8724, - "eval_map_chicken": 0.7548, - "eval_map_duck": 0.6835, - "eval_map_large": 0.7649, - "eval_map_medium": 0.7471, - "eval_map_plant": 0.8172, - "eval_map_small": 0.2416, - "eval_mar_1": 0.2982, - "eval_mar_10": 0.792, - "eval_mar_100": 0.797, - "eval_mar_100_chicken": 0.8004, - "eval_mar_100_duck": 0.7299, - "eval_mar_100_plant": 0.8606, - "eval_mar_large": 0.8121, - "eval_mar_medium": 0.7909, - "eval_mar_small": 0.3657, - "eval_runtime": 12.3679, - "eval_samples_per_second": 8.085, - "eval_steps_per_second": 1.051, - "step": 36000 - }, - { - "epoch": 72.06, - "grad_norm": 131.61239624023438, - "learning_rate": 5.307681564533736e-06, - "loss": 0.5087, - "step": 36030 - }, - { - "epoch": 72.12, - "grad_norm": 33.683692932128906, - "learning_rate": 5.301410045549719e-06, - "loss": 0.4199, - "step": 36060 - }, - { - "epoch": 72.18, - "grad_norm": 48.458431243896484, - "learning_rate": 5.295138050598097e-06, - "loss": 0.4408, - "step": 36090 - }, - { - "epoch": 72.24, - "grad_norm": 322.8694763183594, - "learning_rate": 5.2888655895832075e-06, - "loss": 0.3678, - "step": 36120 - }, - { - "epoch": 72.3, - "grad_norm": 219.04263305664062, - "learning_rate": 5.282592672410124e-06, - "loss": 0.4441, - "step": 36150 - }, - { - "epoch": 72.36, - "grad_norm": 124.94686889648438, - "learning_rate": 5.276319308984637e-06, - "loss": 0.4186, - "step": 36180 - }, - { - "epoch": 72.42, - "grad_norm": 83.0042495727539, - "learning_rate": 5.270045509213244e-06, - "loss": 0.4637, - "step": 36210 - }, - { - "epoch": 72.48, - "grad_norm": 87.41633605957031, - "learning_rate": 5.263771283003133e-06, - "loss": 0.3709, - "step": 36240 - }, - { - "epoch": 72.54, - "grad_norm": 59.93210220336914, - "learning_rate": 5.2574966402621615e-06, - "loss": 0.4324, - "step": 36270 - }, - { - "epoch": 72.6, - "grad_norm": 33.1005859375, - "learning_rate": 5.251221590898848e-06, - "loss": 0.4372, - "step": 36300 - }, - { - "epoch": 72.66, - "grad_norm": 57.52750778198242, - "learning_rate": 5.244946144822351e-06, - "loss": 0.3991, - "step": 36330 - }, - { - "epoch": 72.72, - "grad_norm": 43.97096252441406, - "learning_rate": 5.238670311942459e-06, - "loss": 0.4409, - "step": 36360 - }, - { - "epoch": 72.78, - "grad_norm": 37.51517105102539, - "learning_rate": 5.232394102169566e-06, - "loss": 0.4786, - "step": 36390 - }, - { - "epoch": 72.84, - "grad_norm": 53.2791748046875, - "learning_rate": 5.226117525414663e-06, - "loss": 0.419, - "step": 36420 - }, - { - "epoch": 72.9, - "grad_norm": 46.237361907958984, - "learning_rate": 5.219840591589325e-06, - "loss": 0.3777, - "step": 36450 - }, - { - "epoch": 72.96, - "grad_norm": 200.5348358154297, - "learning_rate": 5.213563310605686e-06, - "loss": 0.4483, - "step": 36480 - }, - { - "epoch": 73.0, - "eval_loss": 0.35082873702049255, - "eval_map": 0.7472, - "eval_map_50": 0.9483, - "eval_map_75": 0.897, - "eval_map_chicken": 0.738, - "eval_map_duck": 0.6835, - "eval_map_large": 0.7725, - "eval_map_medium": 0.753, - "eval_map_plant": 0.8201, - "eval_map_small": 0.2306, - "eval_mar_1": 0.2979, - "eval_mar_10": 0.7963, - "eval_mar_100": 0.8027, - "eval_mar_100_chicken": 0.7944, - "eval_mar_100_duck": 0.7474, - "eval_mar_100_plant": 0.8664, - "eval_mar_large": 0.8304, - "eval_mar_medium": 0.8053, - "eval_mar_small": 0.409, - "eval_runtime": 12.2563, - "eval_samples_per_second": 8.159, - "eval_steps_per_second": 1.061, - "step": 36500 - }, - { - "epoch": 73.02, - "grad_norm": 57.14048385620117, - "learning_rate": 5.207285692376427e-06, - "loss": 0.4022, - "step": 36510 - }, - { - "epoch": 73.08, - "grad_norm": 42.06671142578125, - "learning_rate": 5.201007746814767e-06, - "loss": 0.3748, - "step": 36540 - }, - { - "epoch": 73.14, - "grad_norm": 74.05252838134766, - "learning_rate": 5.194729483834438e-06, - "loss": 0.4788, - "step": 36570 - }, - { - "epoch": 73.2, - "grad_norm": 39.29936981201172, - "learning_rate": 5.188450913349674e-06, - "loss": 0.4776, - "step": 36600 - }, - { - "epoch": 73.26, - "grad_norm": 73.78974151611328, - "learning_rate": 5.1821720452751945e-06, - "loss": 0.3631, - "step": 36630 - }, - { - "epoch": 73.32, - "grad_norm": 55.11795425415039, - "learning_rate": 5.175892889526189e-06, - "loss": 0.3919, - "step": 36660 - }, - { - "epoch": 73.38, - "grad_norm": 35.68388366699219, - "learning_rate": 5.1696134560183045e-06, - "loss": 0.3749, - "step": 36690 - }, - { - "epoch": 73.44, - "grad_norm": 51.747650146484375, - "learning_rate": 5.16333375466762e-06, - "loss": 0.4091, - "step": 36720 - }, - { - "epoch": 73.5, - "grad_norm": 66.83267974853516, - "learning_rate": 5.157053795390642e-06, - "loss": 0.4367, - "step": 36750 - }, - { - "epoch": 73.56, - "grad_norm": 29.858856201171875, - "learning_rate": 5.150773588104284e-06, - "loss": 0.4849, - "step": 36780 - }, - { - "epoch": 73.62, - "grad_norm": 34.38462829589844, - "learning_rate": 5.144493142725851e-06, - "loss": 0.3771, - "step": 36810 - }, - { - "epoch": 73.68, - "grad_norm": 60.14284133911133, - "learning_rate": 5.138212469173022e-06, - "loss": 0.4495, - "step": 36840 - }, - { - "epoch": 73.74, - "grad_norm": 118.01911163330078, - "learning_rate": 5.13193157736384e-06, - "loss": 0.4251, - "step": 36870 - }, - { - "epoch": 73.8, - "grad_norm": 112.14728546142578, - "learning_rate": 5.1256504772166885e-06, - "loss": 0.3839, - "step": 36900 - }, - { - "epoch": 73.86, - "grad_norm": 59.46623992919922, - "learning_rate": 5.119369178650282e-06, - "loss": 0.3774, - "step": 36930 - }, - { - "epoch": 73.92, - "grad_norm": 78.6153335571289, - "learning_rate": 5.1130876915836495e-06, - "loss": 0.4722, - "step": 36960 - }, - { - "epoch": 73.98, - "grad_norm": 55.439579010009766, - "learning_rate": 5.1068060259361155e-06, - "loss": 0.4498, - "step": 36990 - }, - { - "epoch": 74.0, - "eval_loss": 0.3356999456882477, - "eval_map": 0.7632, - "eval_map_50": 0.9535, - "eval_map_75": 0.882, - "eval_map_chicken": 0.7617, - "eval_map_duck": 0.7007, - "eval_map_large": 0.7862, - "eval_map_medium": 0.7633, - "eval_map_plant": 0.8272, - "eval_map_small": 0.2094, - "eval_mar_1": 0.3069, - "eval_mar_10": 0.8033, - "eval_mar_100": 0.8087, - "eval_mar_100_chicken": 0.8091, - "eval_mar_100_duck": 0.7485, - "eval_mar_100_plant": 0.8685, - "eval_mar_large": 0.8324, - "eval_mar_medium": 0.8104, - "eval_mar_small": 0.3448, - "eval_runtime": 13.0612, - "eval_samples_per_second": 7.656, - "eval_steps_per_second": 0.995, - "step": 37000 - }, - { - "epoch": 74.04, - "grad_norm": 64.74147033691406, - "learning_rate": 5.100524191627289e-06, - "loss": 0.4194, - "step": 37020 - }, - { - "epoch": 74.1, - "grad_norm": 78.12037658691406, - "learning_rate": 5.0942421985770415e-06, - "loss": 0.4671, - "step": 37050 - }, - { - "epoch": 74.16, - "grad_norm": 94.69644927978516, - "learning_rate": 5.087960056705499e-06, - "loss": 0.3741, - "step": 37080 - }, - { - "epoch": 74.22, - "grad_norm": 33.74659729003906, - "learning_rate": 5.0816777759330215e-06, - "loss": 0.4425, - "step": 37110 - }, - { - "epoch": 74.28, - "grad_norm": 72.58914947509766, - "learning_rate": 5.075395366180186e-06, - "loss": 0.4312, - "step": 37140 - }, - { - "epoch": 74.34, - "grad_norm": 31.942522048950195, - "learning_rate": 5.069112837367777e-06, - "loss": 0.4246, - "step": 37170 - }, - { - "epoch": 74.4, - "grad_norm": 65.43937683105469, - "learning_rate": 5.062830199416764e-06, - "loss": 0.3582, - "step": 37200 - }, - { - "epoch": 74.46, - "grad_norm": 58.466304779052734, - "learning_rate": 5.05654746224829e-06, - "loss": 0.4749, - "step": 37230 - }, - { - "epoch": 74.52, - "grad_norm": 55.61424255371094, - "learning_rate": 5.050264635783654e-06, - "loss": 0.4461, - "step": 37260 - }, - { - "epoch": 74.58, - "grad_norm": 70.85432434082031, - "learning_rate": 5.043981729944298e-06, - "loss": 0.4671, - "step": 37290 - }, - { - "epoch": 74.64, - "grad_norm": 70.3757095336914, - "learning_rate": 5.037698754651786e-06, - "loss": 0.4394, - "step": 37320 - }, - { - "epoch": 74.7, - "grad_norm": 55.62226486206055, - "learning_rate": 5.031415719827796e-06, - "loss": 0.3489, - "step": 37350 - }, - { - "epoch": 74.76, - "grad_norm": 68.5845947265625, - "learning_rate": 5.025132635394095e-06, - "loss": 0.3887, - "step": 37380 - }, - { - "epoch": 74.82, - "grad_norm": 48.04725646972656, - "learning_rate": 5.018849511272532e-06, - "loss": 0.3496, - "step": 37410 - }, - { - "epoch": 74.88, - "grad_norm": 54.425209045410156, - "learning_rate": 5.0125663573850204e-06, - "loss": 0.354, - "step": 37440 - }, - { - "epoch": 74.94, - "grad_norm": 48.0417366027832, - "learning_rate": 5.006283183653513e-06, - "loss": 0.4457, - "step": 37470 - }, - { - "epoch": 75.0, - "grad_norm": 196.3993682861328, - "learning_rate": 5e-06, - "loss": 0.5208, - "step": 37500 - }, - { - "epoch": 75.0, - "eval_loss": 0.34921568632125854, - "eval_map": 0.7598, - "eval_map_50": 0.9506, - "eval_map_75": 0.8859, - "eval_map_chicken": 0.7466, - "eval_map_duck": 0.6987, - "eval_map_large": 0.7963, - "eval_map_medium": 0.7612, - "eval_map_plant": 0.834, - "eval_map_small": 0.2379, - "eval_mar_1": 0.3067, - "eval_mar_10": 0.7977, - "eval_mar_100": 0.8034, - "eval_mar_100_chicken": 0.7917, - "eval_mar_100_duck": 0.7454, - "eval_mar_100_plant": 0.873, - "eval_mar_large": 0.8349, - "eval_mar_medium": 0.8052, - "eval_mar_small": 0.3476, - "eval_runtime": 13.0356, - "eval_samples_per_second": 7.671, - "eval_steps_per_second": 0.997, - "step": 37500 - }, - { - "epoch": 75.06, - "grad_norm": 102.63311767578125, - "learning_rate": 4.99371681634649e-06, - "loss": 0.3792, - "step": 37530 - }, - { - "epoch": 75.12, - "grad_norm": 44.45432662963867, - "learning_rate": 4.987433642614981e-06, - "loss": 0.4996, - "step": 37560 - }, - { - "epoch": 75.18, - "grad_norm": 49.86972427368164, - "learning_rate": 4.981150488727469e-06, - "loss": 0.5486, - "step": 37590 - }, - { - "epoch": 75.24, - "grad_norm": 162.089599609375, - "learning_rate": 4.974867364605906e-06, - "loss": 0.3067, - "step": 37620 - }, - { - "epoch": 75.3, - "grad_norm": 93.43505859375, - "learning_rate": 4.968584280172206e-06, - "loss": 0.3471, - "step": 37650 - }, - { - "epoch": 75.36, - "grad_norm": 30.907535552978516, - "learning_rate": 4.962301245348215e-06, - "loss": 0.419, - "step": 37680 - }, - { - "epoch": 75.42, - "grad_norm": 43.338035583496094, - "learning_rate": 4.956018270055703e-06, - "loss": 0.4248, - "step": 37710 - }, - { - "epoch": 75.48, - "grad_norm": 76.43923950195312, - "learning_rate": 4.949735364216348e-06, - "loss": 0.3992, - "step": 37740 - }, - { - "epoch": 75.54, - "grad_norm": 35.369808197021484, - "learning_rate": 4.9434525377517115e-06, - "loss": 0.3867, - "step": 37770 - }, - { - "epoch": 75.6, - "grad_norm": 51.02500534057617, - "learning_rate": 4.937169800583237e-06, - "loss": 0.4073, - "step": 37800 - }, - { - "epoch": 75.66, - "grad_norm": 30.535675048828125, - "learning_rate": 4.930887162632225e-06, - "loss": 0.3618, - "step": 37830 - }, - { - "epoch": 75.72, - "grad_norm": 108.95599365234375, - "learning_rate": 4.924604633819815e-06, - "loss": 0.3753, - "step": 37860 - }, - { - "epoch": 75.78, - "grad_norm": 66.89957427978516, - "learning_rate": 4.91832222406698e-06, - "loss": 0.4943, - "step": 37890 - }, - { - "epoch": 75.84, - "grad_norm": 55.6713981628418, - "learning_rate": 4.912039943294502e-06, - "loss": 0.3789, - "step": 37920 - }, - { - "epoch": 75.9, - "grad_norm": 91.84227752685547, - "learning_rate": 4.90575780142296e-06, - "loss": 0.3718, - "step": 37950 - }, - { - "epoch": 75.96, - "grad_norm": 33.526302337646484, - "learning_rate": 4.899475808372714e-06, - "loss": 0.3542, - "step": 37980 - }, - { - "epoch": 76.0, - "eval_loss": 0.3491709232330322, - "eval_map": 0.7606, - "eval_map_50": 0.9431, - "eval_map_75": 0.8889, - "eval_map_chicken": 0.7548, - "eval_map_duck": 0.7124, - "eval_map_large": 0.7958, - "eval_map_medium": 0.7543, - "eval_map_plant": 0.8146, - "eval_map_small": 0.2385, - "eval_mar_1": 0.3072, - "eval_mar_10": 0.7975, - "eval_mar_100": 0.8028, - "eval_mar_100_chicken": 0.7988, - "eval_mar_100_duck": 0.7526, - "eval_mar_100_plant": 0.857, - "eval_mar_large": 0.8427, - "eval_mar_medium": 0.7957, - "eval_mar_small": 0.3724, - "eval_runtime": 13.3961, - "eval_samples_per_second": 7.465, - "eval_steps_per_second": 0.97, - "step": 38000 - }, - { - "epoch": 76.02, - "grad_norm": 176.4849853515625, - "learning_rate": 4.893193974063885e-06, - "loss": 0.4523, - "step": 38010 - }, - { - "epoch": 76.08, - "grad_norm": 188.09324645996094, - "learning_rate": 4.886912308416353e-06, - "loss": 0.4504, - "step": 38040 - }, - { - "epoch": 76.14, - "grad_norm": 46.274696350097656, - "learning_rate": 4.880630821349718e-06, - "loss": 0.4126, - "step": 38070 - }, - { - "epoch": 76.2, - "grad_norm": 155.42689514160156, - "learning_rate": 4.874349522783313e-06, - "loss": 0.3243, - "step": 38100 - }, - { - "epoch": 76.26, - "grad_norm": 66.27310943603516, - "learning_rate": 4.8680684226361624e-06, - "loss": 0.4376, - "step": 38130 - }, - { - "epoch": 76.32, - "grad_norm": 41.6434326171875, - "learning_rate": 4.861787530826979e-06, - "loss": 0.3979, - "step": 38160 - }, - { - "epoch": 76.38, - "grad_norm": 35.163848876953125, - "learning_rate": 4.85550685727415e-06, - "loss": 0.32, - "step": 38190 - }, - { - "epoch": 76.44, - "grad_norm": 39.82311248779297, - "learning_rate": 4.8492264118957165e-06, - "loss": 0.5402, - "step": 38220 - }, - { - "epoch": 76.5, - "grad_norm": 229.9091033935547, - "learning_rate": 4.842946204609359e-06, - "loss": 0.4054, - "step": 38250 - }, - { - "epoch": 76.56, - "grad_norm": 60.694252014160156, - "learning_rate": 4.8366662453323826e-06, - "loss": 0.3697, - "step": 38280 - }, - { - "epoch": 76.62, - "grad_norm": 55.6748046875, - "learning_rate": 4.830386543981696e-06, - "loss": 0.4069, - "step": 38310 - }, - { - "epoch": 76.68, - "grad_norm": 30.92841911315918, - "learning_rate": 4.8241071104738115e-06, - "loss": 0.418, - "step": 38340 - }, - { - "epoch": 76.74, - "grad_norm": 55.51054382324219, - "learning_rate": 4.8178279547248055e-06, - "loss": 0.643, - "step": 38370 - }, - { - "epoch": 76.8, - "grad_norm": 73.16288757324219, - "learning_rate": 4.811549086650327e-06, - "loss": 0.3539, - "step": 38400 - }, - { - "epoch": 76.86, - "grad_norm": 43.31676483154297, - "learning_rate": 4.805270516165564e-06, - "loss": 0.3947, - "step": 38430 - }, - { - "epoch": 76.92, - "grad_norm": 53.91853332519531, - "learning_rate": 4.798992253185233e-06, - "loss": 0.4008, - "step": 38460 - }, - { - "epoch": 76.98, - "grad_norm": 67.2529067993164, - "learning_rate": 4.792714307623574e-06, - "loss": 0.439, - "step": 38490 - }, - { - "epoch": 77.0, - "eval_loss": 0.3485209345817566, - "eval_map": 0.7617, - "eval_map_50": 0.9583, - "eval_map_75": 0.8965, - "eval_map_chicken": 0.7599, - "eval_map_duck": 0.6995, - "eval_map_large": 0.7814, - "eval_map_medium": 0.7633, - "eval_map_plant": 0.8257, - "eval_map_small": 0.213, - "eval_mar_1": 0.3039, - "eval_mar_10": 0.7998, - "eval_mar_100": 0.8063, - "eval_mar_100_chicken": 0.8036, - "eval_mar_100_duck": 0.7474, - "eval_mar_100_plant": 0.8679, - "eval_mar_large": 0.8302, - "eval_mar_medium": 0.8052, - "eval_mar_small": 0.3343, - "eval_runtime": 13.7577, - "eval_samples_per_second": 7.269, - "eval_steps_per_second": 0.945, - "step": 38500 - }, - { - "epoch": 77.04, - "grad_norm": 36.28005599975586, - "learning_rate": 4.786436689394317e-06, - "loss": 0.4211, - "step": 38520 - }, - { - "epoch": 77.1, - "grad_norm": 125.74197387695312, - "learning_rate": 4.780159408410677e-06, - "loss": 0.4807, - "step": 38550 - }, - { - "epoch": 77.16, - "grad_norm": 52.85602569580078, - "learning_rate": 4.773882474585338e-06, - "loss": 0.3429, - "step": 38580 - }, - { - "epoch": 77.22, - "grad_norm": 34.18029022216797, - "learning_rate": 4.767605897830436e-06, - "loss": 0.457, - "step": 38610 - }, - { - "epoch": 77.28, - "grad_norm": 106.94581604003906, - "learning_rate": 4.761329688057543e-06, - "loss": 0.4318, - "step": 38640 - }, - { - "epoch": 77.34, - "grad_norm": 66.56904602050781, - "learning_rate": 4.7550538551776495e-06, - "loss": 0.5025, - "step": 38670 - }, - { - "epoch": 77.4, - "grad_norm": 33.639957427978516, - "learning_rate": 4.748778409101153e-06, - "loss": 0.4006, - "step": 38700 - }, - { - "epoch": 77.46, - "grad_norm": 95.43140411376953, - "learning_rate": 4.742503359737841e-06, - "loss": 0.3822, - "step": 38730 - }, - { - "epoch": 77.52, - "grad_norm": 140.26458740234375, - "learning_rate": 4.736228716996868e-06, - "loss": 0.4077, - "step": 38760 - }, - { - "epoch": 77.58, - "grad_norm": 39.40882873535156, - "learning_rate": 4.7299544907867576e-06, - "loss": 0.3645, - "step": 38790 - }, - { - "epoch": 77.64, - "grad_norm": 355.2059326171875, - "learning_rate": 4.723680691015366e-06, - "loss": 0.4183, - "step": 38820 - }, - { - "epoch": 77.7, - "grad_norm": 93.6492919921875, - "learning_rate": 4.717407327589878e-06, - "loss": 0.3684, - "step": 38850 - }, - { - "epoch": 77.76, - "grad_norm": 64.07270050048828, - "learning_rate": 4.711134410416794e-06, - "loss": 0.4045, - "step": 38880 - }, - { - "epoch": 77.82, - "grad_norm": 46.11160659790039, - "learning_rate": 4.704861949401904e-06, - "loss": 0.4153, - "step": 38910 - }, - { - "epoch": 77.88, - "grad_norm": 59.16080093383789, - "learning_rate": 4.6985899544502835e-06, - "loss": 0.376, - "step": 38940 - }, - { - "epoch": 77.94, - "grad_norm": 47.295249938964844, - "learning_rate": 4.692318435466265e-06, - "loss": 0.4368, - "step": 38970 - }, - { - "epoch": 78.0, - "grad_norm": 57.80942916870117, - "learning_rate": 4.686047402353433e-06, - "loss": 0.4294, - "step": 39000 - }, - { - "epoch": 78.0, - "eval_loss": 0.3406044840812683, - "eval_map": 0.7562, - "eval_map_50": 0.947, - "eval_map_75": 0.8774, - "eval_map_chicken": 0.7478, - "eval_map_duck": 0.6802, - "eval_map_large": 0.7739, - "eval_map_medium": 0.7586, - "eval_map_plant": 0.8405, - "eval_map_small": 0.2508, - "eval_mar_1": 0.3044, - "eval_mar_10": 0.7915, - "eval_mar_100": 0.7994, - "eval_mar_100_chicken": 0.7917, - "eval_mar_100_duck": 0.7268, - "eval_mar_100_plant": 0.8797, - "eval_mar_large": 0.8081, - "eval_mar_medium": 0.8001, - "eval_mar_small": 0.3657, - "eval_runtime": 13.8773, - "eval_samples_per_second": 7.206, - "eval_steps_per_second": 0.937, - "step": 39000 - }, - { - "epoch": 78.06, - "grad_norm": 355.2297668457031, - "learning_rate": 4.679776865014609e-06, - "loss": 0.4002, - "step": 39030 - }, - { - "epoch": 78.12, - "grad_norm": 52.5995979309082, - "learning_rate": 4.673506833351821e-06, - "loss": 0.3932, - "step": 39060 - }, - { - "epoch": 78.18, - "grad_norm": 87.88226318359375, - "learning_rate": 4.667237317266311e-06, - "loss": 0.4794, - "step": 39090 - }, - { - "epoch": 78.24, - "grad_norm": 48.06367111206055, - "learning_rate": 4.660968326658497e-06, - "loss": 0.3785, - "step": 39120 - }, - { - "epoch": 78.3, - "grad_norm": 47.42380142211914, - "learning_rate": 4.654699871427972e-06, - "loss": 0.4504, - "step": 39150 - }, - { - "epoch": 78.36, - "grad_norm": 67.56281280517578, - "learning_rate": 4.648431961473482e-06, - "loss": 0.3373, - "step": 39180 - }, - { - "epoch": 78.42, - "grad_norm": 79.9132308959961, - "learning_rate": 4.642164606692912e-06, - "loss": 0.395, - "step": 39210 - }, - { - "epoch": 78.48, - "grad_norm": 216.938720703125, - "learning_rate": 4.635897816983272e-06, - "loss": 0.3761, - "step": 39240 - }, - { - "epoch": 78.54, - "grad_norm": 61.320316314697266, - "learning_rate": 4.629631602240678e-06, - "loss": 0.4511, - "step": 39270 - }, - { - "epoch": 78.6, - "grad_norm": 35.84014129638672, - "learning_rate": 4.6233659723603374e-06, - "loss": 0.3321, - "step": 39300 - }, - { - "epoch": 78.66, - "grad_norm": 48.47278594970703, - "learning_rate": 4.617100937236535e-06, - "loss": 0.3604, - "step": 39330 - }, - { - "epoch": 78.72, - "grad_norm": 16.092552185058594, - "learning_rate": 4.610836506762618e-06, - "loss": 0.3968, - "step": 39360 - }, - { - "epoch": 78.78, - "grad_norm": 49.87882614135742, - "learning_rate": 4.604572690830976e-06, - "loss": 0.3407, - "step": 39390 - }, - { - "epoch": 78.84, - "grad_norm": 71.10816192626953, - "learning_rate": 4.59830949933303e-06, - "loss": 0.4385, - "step": 39420 - }, - { - "epoch": 78.9, - "grad_norm": 30.709915161132812, - "learning_rate": 4.592046942159213e-06, - "loss": 0.4462, - "step": 39450 - }, - { - "epoch": 78.96, - "grad_norm": 147.6481475830078, - "learning_rate": 4.5857850291989596e-06, - "loss": 0.3643, - "step": 39480 - }, - { - "epoch": 79.0, - "eval_loss": 0.32853129506111145, - "eval_map": 0.7607, - "eval_map_50": 0.9492, - "eval_map_75": 0.8828, - "eval_map_chicken": 0.7602, - "eval_map_duck": 0.6911, - "eval_map_large": 0.7663, - "eval_map_medium": 0.7627, - "eval_map_plant": 0.8309, - "eval_map_small": 0.2242, - "eval_mar_1": 0.3047, - "eval_mar_10": 0.7998, - "eval_mar_100": 0.8045, - "eval_mar_100_chicken": 0.804, - "eval_mar_100_duck": 0.7402, - "eval_mar_100_plant": 0.8694, - "eval_mar_large": 0.809, - "eval_mar_medium": 0.8074, - "eval_mar_small": 0.3529, - "eval_runtime": 13.3554, - "eval_samples_per_second": 7.488, - "eval_steps_per_second": 0.973, - "step": 39500 - }, - { - "epoch": 79.02, - "grad_norm": 57.626468658447266, - "learning_rate": 4.579523770340681e-06, - "loss": 0.3743, - "step": 39510 - }, - { - "epoch": 79.08, - "grad_norm": 69.79145050048828, - "learning_rate": 4.573263175471766e-06, - "loss": 0.4185, - "step": 39540 - }, - { - "epoch": 79.14, - "grad_norm": 68.27862548828125, - "learning_rate": 4.567003254478545e-06, - "loss": 0.4065, - "step": 39570 - }, - { - "epoch": 79.2, - "grad_norm": 88.22193145751953, - "learning_rate": 4.560744017246284e-06, - "loss": 0.4247, - "step": 39600 - }, - { - "epoch": 79.26, - "grad_norm": 328.2776794433594, - "learning_rate": 4.55448547365918e-06, - "loss": 0.3754, - "step": 39630 - }, - { - "epoch": 79.32, - "grad_norm": 63.862327575683594, - "learning_rate": 4.548227633600322e-06, - "loss": 0.3743, - "step": 39660 - }, - { - "epoch": 79.38, - "grad_norm": 446.0810546875, - "learning_rate": 4.541970506951698e-06, - "loss": 0.3817, - "step": 39690 - }, - { - "epoch": 79.44, - "grad_norm": 59.019962310791016, - "learning_rate": 4.535714103594162e-06, - "loss": 0.4557, - "step": 39720 - }, - { - "epoch": 79.5, - "grad_norm": 53.41251754760742, - "learning_rate": 4.529458433407429e-06, - "loss": 0.4579, - "step": 39750 - }, - { - "epoch": 79.56, - "grad_norm": 54.333255767822266, - "learning_rate": 4.523203506270058e-06, - "loss": 0.4544, - "step": 39780 - }, - { - "epoch": 79.62, - "grad_norm": 62.91282272338867, - "learning_rate": 4.516949332059429e-06, - "loss": 0.4096, - "step": 39810 - }, - { - "epoch": 79.68, - "grad_norm": 27.472501754760742, - "learning_rate": 4.510695920651742e-06, - "loss": 0.4776, - "step": 39840 - }, - { - "epoch": 79.74, - "grad_norm": 59.355979919433594, - "learning_rate": 4.504443281921985e-06, - "loss": 0.4013, - "step": 39870 - }, - { - "epoch": 79.8, - "grad_norm": 68.70120239257812, - "learning_rate": 4.4981914257439254e-06, - "loss": 0.3891, - "step": 39900 - }, - { - "epoch": 79.86, - "grad_norm": 36.31624984741211, - "learning_rate": 4.491940361990101e-06, - "loss": 0.4313, - "step": 39930 - }, - { - "epoch": 79.92, - "grad_norm": 59.34695816040039, - "learning_rate": 4.485690100531793e-06, - "loss": 0.3352, - "step": 39960 - }, - { - "epoch": 79.98, - "grad_norm": 53.59098434448242, - "learning_rate": 4.4794406512390175e-06, - "loss": 0.3089, - "step": 39990 - }, - { - "epoch": 80.0, - "eval_loss": 0.3194189667701721, - "eval_map": 0.7734, - "eval_map_50": 0.9514, - "eval_map_75": 0.8911, - "eval_map_chicken": 0.773, - "eval_map_duck": 0.7036, - "eval_map_large": 0.808, - "eval_map_medium": 0.773, - "eval_map_plant": 0.8436, - "eval_map_small": 0.2526, - "eval_mar_1": 0.3087, - "eval_mar_10": 0.8092, - "eval_mar_100": 0.8163, - "eval_mar_100_chicken": 0.8175, - "eval_mar_100_duck": 0.7515, - "eval_mar_100_plant": 0.88, - "eval_mar_large": 0.8501, - "eval_mar_medium": 0.8168, - "eval_mar_small": 0.3805, - "eval_runtime": 12.5236, - "eval_samples_per_second": 7.985, - "eval_steps_per_second": 1.038, - "step": 40000 - }, - { - "epoch": 80.04, - "grad_norm": 65.6666488647461, - "learning_rate": 4.473192023980509e-06, - "loss": 0.4082, - "step": 40020 - }, - { - "epoch": 80.1, - "grad_norm": 43.5830078125, - "learning_rate": 4.466944228623701e-06, - "loss": 0.3798, - "step": 40050 - }, - { - "epoch": 80.16, - "grad_norm": 51.86589813232422, - "learning_rate": 4.460697275034717e-06, - "loss": 0.3908, - "step": 40080 - }, - { - "epoch": 80.22, - "grad_norm": 52.364742279052734, - "learning_rate": 4.454451173078347e-06, - "loss": 0.3591, - "step": 40110 - }, - { - "epoch": 80.28, - "grad_norm": 86.60858917236328, - "learning_rate": 4.448205932618042e-06, - "loss": 0.4148, - "step": 40140 - }, - { - "epoch": 80.34, - "grad_norm": 38.18660354614258, - "learning_rate": 4.4419615635158875e-06, - "loss": 0.3184, - "step": 40170 - }, - { - "epoch": 80.4, - "grad_norm": 65.76779174804688, - "learning_rate": 4.4357180756325915e-06, - "loss": 0.4159, - "step": 40200 - }, - { - "epoch": 80.46, - "grad_norm": 67.82655334472656, - "learning_rate": 4.42947547882748e-06, - "loss": 0.4103, - "step": 40230 - }, - { - "epoch": 80.52, - "grad_norm": 44.573997497558594, - "learning_rate": 4.423233782958459e-06, - "loss": 0.3903, - "step": 40260 - }, - { - "epoch": 80.58, - "grad_norm": 42.79051208496094, - "learning_rate": 4.416992997882023e-06, - "loss": 0.5362, - "step": 40290 - }, - { - "epoch": 80.64, - "grad_norm": 77.00391387939453, - "learning_rate": 4.410753133453222e-06, - "loss": 0.4555, - "step": 40320 - }, - { - "epoch": 80.7, - "grad_norm": 49.76982498168945, - "learning_rate": 4.404514199525651e-06, - "loss": 0.3536, - "step": 40350 - }, - { - "epoch": 80.76, - "grad_norm": 79.78474426269531, - "learning_rate": 4.398276205951443e-06, - "loss": 0.4245, - "step": 40380 - }, - { - "epoch": 80.82, - "grad_norm": 0.0004934342578053474, - "learning_rate": 4.392039162581239e-06, - "loss": 0.3957, - "step": 40410 - }, - { - "epoch": 80.88, - "grad_norm": 111.93219757080078, - "learning_rate": 4.38580307926418e-06, - "loss": 0.4646, - "step": 40440 - }, - { - "epoch": 80.94, - "grad_norm": 43.957115173339844, - "learning_rate": 4.379567965847896e-06, - "loss": 0.2984, - "step": 40470 - }, - { - "epoch": 81.0, - "grad_norm": 63.26675796508789, - "learning_rate": 4.373333832178478e-06, - "loss": 0.3825, - "step": 40500 - }, - { - "epoch": 81.0, - "eval_loss": 0.3217299282550812, - "eval_map": 0.7671, - "eval_map_50": 0.9532, - "eval_map_75": 0.8831, - "eval_map_chicken": 0.7627, - "eval_map_duck": 0.7031, - "eval_map_large": 0.8157, - "eval_map_medium": 0.7599, - "eval_map_plant": 0.8354, - "eval_map_small": 0.2602, - "eval_mar_1": 0.3076, - "eval_mar_10": 0.8079, - "eval_mar_100": 0.8136, - "eval_mar_100_chicken": 0.8147, - "eval_mar_100_duck": 0.7557, - "eval_mar_100_plant": 0.8703, - "eval_mar_large": 0.8615, - "eval_mar_medium": 0.8041, - "eval_mar_small": 0.3638, - "eval_runtime": 13.9519, - "eval_samples_per_second": 7.168, - "eval_steps_per_second": 0.932, - "step": 40500 - }, - { - "epoch": 81.06, - "grad_norm": 43.765098571777344, - "learning_rate": 4.36710068810048e-06, - "loss": 0.3538, - "step": 40530 - }, - { - "epoch": 81.12, - "grad_norm": 40.00071716308594, - "learning_rate": 4.360868543456883e-06, - "loss": 0.4956, - "step": 40560 - }, - { - "epoch": 81.18, - "grad_norm": 40.398956298828125, - "learning_rate": 4.354637408089093e-06, - "loss": 0.5314, - "step": 40590 - }, - { - "epoch": 81.24, - "grad_norm": 82.89373779296875, - "learning_rate": 4.348407291836928e-06, - "loss": 0.3578, - "step": 40620 - }, - { - "epoch": 81.3, - "grad_norm": 70.76558685302734, - "learning_rate": 4.342178204538588e-06, - "loss": 0.4374, - "step": 40650 - }, - { - "epoch": 81.36, - "grad_norm": 74.86760711669922, - "learning_rate": 4.335950156030653e-06, - "loss": 0.3958, - "step": 40680 - }, - { - "epoch": 81.42, - "grad_norm": 88.6963119506836, - "learning_rate": 4.329723156148064e-06, - "loss": 0.3679, - "step": 40710 - }, - { - "epoch": 81.48, - "grad_norm": 50.40531539916992, - "learning_rate": 4.323497214724099e-06, - "loss": 0.454, - "step": 40740 - }, - { - "epoch": 81.54, - "grad_norm": 53.5130615234375, - "learning_rate": 4.317272341590373e-06, - "loss": 0.3717, - "step": 40770 - }, - { - "epoch": 81.6, - "grad_norm": 59.9133415222168, - "learning_rate": 4.31104854657681e-06, - "loss": 0.4389, - "step": 40800 - }, - { - "epoch": 81.66, - "grad_norm": 31.516071319580078, - "learning_rate": 4.3048258395116326e-06, - "loss": 0.4058, - "step": 40830 - }, - { - "epoch": 81.72, - "grad_norm": 33.90363311767578, - "learning_rate": 4.298604230221341e-06, - "loss": 0.4415, - "step": 40860 - }, - { - "epoch": 81.78, - "grad_norm": 74.33262634277344, - "learning_rate": 4.2923837285307085e-06, - "loss": 0.3182, - "step": 40890 - }, - { - "epoch": 81.84, - "grad_norm": 40.281471252441406, - "learning_rate": 4.286164344262756e-06, - "loss": 0.4081, - "step": 40920 - }, - { - "epoch": 81.9, - "grad_norm": 31.47854995727539, - "learning_rate": 4.279946087238739e-06, - "loss": 0.3586, - "step": 40950 - }, - { - "epoch": 81.96, - "grad_norm": 39.215797424316406, - "learning_rate": 4.273728967278137e-06, - "loss": 0.465, - "step": 40980 - }, - { - "epoch": 82.0, - "eval_loss": 0.3319142162799835, - "eval_map": 0.7729, - "eval_map_50": 0.9571, - "eval_map_75": 0.8953, - "eval_map_chicken": 0.7579, - "eval_map_duck": 0.7203, - "eval_map_large": 0.812, - "eval_map_medium": 0.7677, - "eval_map_plant": 0.8404, - "eval_map_small": 0.2869, - "eval_mar_1": 0.3083, - "eval_mar_10": 0.8123, - "eval_mar_100": 0.8173, - "eval_mar_100_chicken": 0.8024, - "eval_mar_100_duck": 0.7711, - "eval_mar_100_plant": 0.8785, - "eval_mar_large": 0.8534, - "eval_mar_medium": 0.8111, - "eval_mar_small": 0.3862, - "eval_runtime": 12.8394, - "eval_samples_per_second": 7.789, - "eval_steps_per_second": 1.013, - "step": 41000 - }, - { - "epoch": 82.02, - "grad_norm": 0.0003232374438084662, - "learning_rate": 4.267512994198629e-06, - "loss": 0.4549, - "step": 41010 - }, - { - "epoch": 82.08, - "grad_norm": 53.96706771850586, - "learning_rate": 4.261298177816082e-06, - "loss": 0.3797, - "step": 41040 - }, - { - "epoch": 82.14, - "grad_norm": 32.9339485168457, - "learning_rate": 4.2550845279445455e-06, - "loss": 0.3341, - "step": 41070 - }, - { - "epoch": 82.2, - "grad_norm": 39.30419921875, - "learning_rate": 4.248872054396215e-06, - "loss": 0.3416, - "step": 41100 - }, - { - "epoch": 82.26, - "grad_norm": 62.170982360839844, - "learning_rate": 4.242660766981439e-06, - "loss": 0.3309, - "step": 41130 - }, - { - "epoch": 82.32, - "grad_norm": 41.5063591003418, - "learning_rate": 4.2364506755086856e-06, - "loss": 0.5078, - "step": 41160 - }, - { - "epoch": 82.38, - "grad_norm": 5.863053593202494e-05, - "learning_rate": 4.230241789784535e-06, - "loss": 0.4363, - "step": 41190 - }, - { - "epoch": 82.44, - "grad_norm": 64.28311157226562, - "learning_rate": 4.224034119613671e-06, - "loss": 0.3373, - "step": 41220 - }, - { - "epoch": 82.5, - "grad_norm": 43.275230407714844, - "learning_rate": 4.217827674798845e-06, - "loss": 0.3243, - "step": 41250 - }, - { - "epoch": 82.56, - "grad_norm": 49.93529510498047, - "learning_rate": 4.211622465140887e-06, - "loss": 0.4209, - "step": 41280 - }, - { - "epoch": 82.62, - "grad_norm": 118.22904968261719, - "learning_rate": 4.2054185004386675e-06, - "loss": 0.3981, - "step": 41310 - }, - { - "epoch": 82.68, - "grad_norm": 49.88104248046875, - "learning_rate": 4.199215790489091e-06, - "loss": 0.4734, - "step": 41340 - }, - { - "epoch": 82.74, - "grad_norm": 37.37254333496094, - "learning_rate": 4.193014345087088e-06, - "loss": 0.44, - "step": 41370 - }, - { - "epoch": 82.8, - "grad_norm": 122.6294174194336, - "learning_rate": 4.186814174025582e-06, - "loss": 0.3874, - "step": 41400 - }, - { - "epoch": 82.86, - "grad_norm": 73.6717529296875, - "learning_rate": 4.180615287095494e-06, - "loss": 0.4097, - "step": 41430 - }, - { - "epoch": 82.92, - "grad_norm": 52.6181640625, - "learning_rate": 4.174417694085711e-06, - "loss": 0.433, - "step": 41460 - }, - { - "epoch": 82.98, - "grad_norm": 34.0953483581543, - "learning_rate": 4.168221404783076e-06, - "loss": 0.3699, - "step": 41490 - }, - { - "epoch": 83.0, - "eval_loss": 0.33553847670555115, - "eval_map": 0.7681, - "eval_map_50": 0.9404, - "eval_map_75": 0.8881, - "eval_map_chicken": 0.7788, - "eval_map_duck": 0.7036, - "eval_map_large": 0.7947, - "eval_map_medium": 0.7663, - "eval_map_plant": 0.8218, - "eval_map_small": 0.2056, - "eval_mar_1": 0.3088, - "eval_mar_10": 0.8062, - "eval_mar_100": 0.8112, - "eval_mar_100_chicken": 0.8246, - "eval_mar_100_duck": 0.7443, - "eval_mar_100_plant": 0.8645, - "eval_mar_large": 0.8387, - "eval_mar_medium": 0.809, - "eval_mar_small": 0.2671, - "eval_runtime": 13.4811, - "eval_samples_per_second": 7.418, - "eval_steps_per_second": 0.964, - "step": 41500 - }, - { - "epoch": 83.04, - "grad_norm": 44.96345138549805, - "learning_rate": 4.16202642897238e-06, - "loss": 0.4554, - "step": 41520 - }, - { - "epoch": 83.1, - "grad_norm": 222.92185974121094, - "learning_rate": 4.155832776436331e-06, - "loss": 0.3129, - "step": 41550 - }, - { - "epoch": 83.16, - "grad_norm": 106.24298095703125, - "learning_rate": 4.149640456955555e-06, - "loss": 0.4211, - "step": 41580 - }, - { - "epoch": 83.22, - "grad_norm": 84.29071044921875, - "learning_rate": 4.143449480308569e-06, - "loss": 0.3587, - "step": 41610 - }, - { - "epoch": 83.28, - "grad_norm": 49.473636627197266, - "learning_rate": 4.137259856271767e-06, - "loss": 0.4076, - "step": 41640 - }, - { - "epoch": 83.34, - "grad_norm": 79.51416778564453, - "learning_rate": 4.131071594619416e-06, - "loss": 0.4051, - "step": 41670 - }, - { - "epoch": 83.4, - "grad_norm": 135.29965209960938, - "learning_rate": 4.124884705123619e-06, - "loss": 0.4615, - "step": 41700 - }, - { - "epoch": 83.46, - "grad_norm": 73.52564239501953, - "learning_rate": 4.118699197554327e-06, - "loss": 0.4144, - "step": 41730 - }, - { - "epoch": 83.52, - "grad_norm": 0.0007346854545176029, - "learning_rate": 4.112515081679295e-06, - "loss": 0.4484, - "step": 41760 - }, - { - "epoch": 83.58, - "grad_norm": 66.4422836303711, - "learning_rate": 4.106332367264085e-06, - "loss": 0.3751, - "step": 41790 - }, - { - "epoch": 83.64, - "grad_norm": 54.533084869384766, - "learning_rate": 4.1001510640720525e-06, - "loss": 0.4054, - "step": 41820 - }, - { - "epoch": 83.7, - "grad_norm": 68.78630065917969, - "learning_rate": 4.093971181864313e-06, - "loss": 0.3498, - "step": 41850 - }, - { - "epoch": 83.76, - "grad_norm": 119.73062133789062, - "learning_rate": 4.087792730399749e-06, - "loss": 0.4177, - "step": 41880 - }, - { - "epoch": 83.82, - "grad_norm": 85.17146301269531, - "learning_rate": 4.081615719434978e-06, - "loss": 0.4026, - "step": 41910 - }, - { - "epoch": 83.88, - "grad_norm": 69.35352325439453, - "learning_rate": 4.075440158724339e-06, - "loss": 0.3724, - "step": 41940 - }, - { - "epoch": 83.94, - "grad_norm": 49.73758316040039, - "learning_rate": 4.0692660580198905e-06, - "loss": 0.3721, - "step": 41970 - }, - { - "epoch": 84.0, - "grad_norm": 86.88200378417969, - "learning_rate": 4.063093427071376e-06, - "loss": 0.4712, - "step": 42000 - }, - { - "epoch": 84.0, - "eval_loss": 0.35030093789100647, - "eval_map": 0.7537, - "eval_map_50": 0.9542, - "eval_map_75": 0.8957, - "eval_map_chicken": 0.7472, - "eval_map_duck": 0.6924, - "eval_map_large": 0.7776, - "eval_map_medium": 0.7501, - "eval_map_plant": 0.8214, - "eval_map_small": 0.2904, - "eval_mar_1": 0.3017, - "eval_mar_10": 0.7948, - "eval_mar_100": 0.8006, - "eval_mar_100_chicken": 0.7984, - "eval_mar_100_duck": 0.7423, - "eval_mar_100_plant": 0.8612, - "eval_mar_large": 0.8247, - "eval_mar_medium": 0.7959, - "eval_mar_small": 0.3829, - "eval_runtime": 14.0954, - "eval_samples_per_second": 7.095, - "eval_steps_per_second": 0.922, - "step": 42000 - }, - { - "epoch": 84.06, - "grad_norm": 53.9143180847168, - "learning_rate": 4.056922275626227e-06, - "loss": 0.4626, - "step": 42030 - }, - { - "epoch": 84.12, - "grad_norm": 30.344152450561523, - "learning_rate": 4.0507526134295314e-06, - "loss": 0.3654, - "step": 42060 - }, - { - "epoch": 84.18, - "grad_norm": 80.7647705078125, - "learning_rate": 4.044584450224026e-06, - "loss": 0.3983, - "step": 42090 - }, - { - "epoch": 84.24, - "grad_norm": 75.35958099365234, - "learning_rate": 4.038417795750086e-06, - "loss": 0.4443, - "step": 42120 - }, - { - "epoch": 84.3, - "grad_norm": 41.08534240722656, - "learning_rate": 4.032252659745699e-06, - "loss": 0.48, - "step": 42150 - }, - { - "epoch": 84.36, - "grad_norm": 54.23200225830078, - "learning_rate": 4.0260890519464565e-06, - "loss": 0.3444, - "step": 42180 - }, - { - "epoch": 84.42, - "grad_norm": 30.99652671813965, - "learning_rate": 4.019926982085536e-06, - "loss": 0.3804, - "step": 42210 - }, - { - "epoch": 84.48, - "grad_norm": 91.6404800415039, - "learning_rate": 4.013766459893686e-06, - "loss": 0.4213, - "step": 42240 - }, - { - "epoch": 84.54, - "grad_norm": 5.198516373638995e-05, - "learning_rate": 4.007607495099215e-06, - "loss": 0.4046, - "step": 42270 - }, - { - "epoch": 84.6, - "grad_norm": 68.38336181640625, - "learning_rate": 4.001450097427965e-06, - "loss": 0.384, - "step": 42300 - }, - { - "epoch": 84.66, - "grad_norm": 59.46340560913086, - "learning_rate": 3.995294276603312e-06, - "loss": 0.4065, - "step": 42330 - }, - { - "epoch": 84.72, - "grad_norm": 44.93857955932617, - "learning_rate": 3.989140042346134e-06, - "loss": 0.3444, - "step": 42360 - }, - { - "epoch": 84.78, - "grad_norm": 35.59174346923828, - "learning_rate": 3.9829874043748064e-06, - "loss": 0.3326, - "step": 42390 - }, - { - "epoch": 84.84, - "grad_norm": 77.32077026367188, - "learning_rate": 3.9768363724051875e-06, - "loss": 0.3777, - "step": 42420 - }, - { - "epoch": 84.9, - "grad_norm": 45.49907302856445, - "learning_rate": 3.970686956150595e-06, - "loss": 0.3798, - "step": 42450 - }, - { - "epoch": 84.96, - "grad_norm": 47.95565414428711, - "learning_rate": 3.964539165321795e-06, - "loss": 0.3711, - "step": 42480 - }, - { - "epoch": 85.0, - "eval_loss": 0.3333532214164734, - "eval_map": 0.7686, - "eval_map_50": 0.9549, - "eval_map_75": 0.8986, - "eval_map_chicken": 0.7423, - "eval_map_duck": 0.7212, - "eval_map_large": 0.8073, - "eval_map_medium": 0.7664, - "eval_map_plant": 0.8425, - "eval_map_small": 0.2611, - "eval_mar_1": 0.3066, - "eval_mar_10": 0.8066, - "eval_mar_100": 0.8126, - "eval_mar_100_chicken": 0.7905, - "eval_mar_100_duck": 0.768, - "eval_mar_100_plant": 0.8794, - "eval_mar_large": 0.8506, - "eval_mar_medium": 0.8067, - "eval_mar_small": 0.3724, - "eval_runtime": 14.0319, - "eval_samples_per_second": 7.127, - "eval_steps_per_second": 0.926, - "step": 42500 - }, - { - "epoch": 85.02, - "grad_norm": 39.73072052001953, - "learning_rate": 3.95839300962699e-06, - "loss": 0.3812, - "step": 42510 - }, - { - "epoch": 85.08, - "grad_norm": 63.30912780761719, - "learning_rate": 3.952248498771797e-06, - "loss": 0.3835, - "step": 42540 - }, - { - "epoch": 85.14, - "grad_norm": 60.497249603271484, - "learning_rate": 3.946105642459241e-06, - "loss": 0.3994, - "step": 42570 - }, - { - "epoch": 85.2, - "grad_norm": 72.43930053710938, - "learning_rate": 3.939964450389728e-06, - "loss": 0.3594, - "step": 42600 - }, - { - "epoch": 85.26, - "grad_norm": 48.033729553222656, - "learning_rate": 3.9338249322610375e-06, - "loss": 0.3904, - "step": 42630 - }, - { - "epoch": 85.32, - "grad_norm": 3.571917841327377e-05, - "learning_rate": 3.927687097768309e-06, - "loss": 0.3841, - "step": 42660 - }, - { - "epoch": 85.38, - "grad_norm": 136.57557678222656, - "learning_rate": 3.921550956604019e-06, - "loss": 0.3325, - "step": 42690 - }, - { - "epoch": 85.44, - "grad_norm": 45.00989532470703, - "learning_rate": 3.915416518457974e-06, - "loss": 0.4605, - "step": 42720 - }, - { - "epoch": 85.5, - "grad_norm": 151.85511779785156, - "learning_rate": 3.909283793017289e-06, - "loss": 0.3987, - "step": 42750 - }, - { - "epoch": 85.56, - "grad_norm": 158.4957733154297, - "learning_rate": 3.9031527899663705e-06, - "loss": 0.4373, - "step": 42780 - }, - { - "epoch": 85.62, - "grad_norm": 32.463966369628906, - "learning_rate": 3.897023518986915e-06, - "loss": 0.4533, - "step": 42810 - }, - { - "epoch": 85.68, - "grad_norm": 91.0557861328125, - "learning_rate": 3.890895989757874e-06, - "loss": 0.3048, - "step": 42840 - }, - { - "epoch": 85.74, - "grad_norm": 88.0126953125, - "learning_rate": 3.884770211955454e-06, - "loss": 0.392, - "step": 42870 - }, - { - "epoch": 85.8, - "grad_norm": 90.39067077636719, - "learning_rate": 3.8786461952530955e-06, - "loss": 0.5168, - "step": 42900 - }, - { - "epoch": 85.86, - "grad_norm": 76.5845718383789, - "learning_rate": 3.872523949321454e-06, - "loss": 0.3717, - "step": 42930 - }, - { - "epoch": 85.92, - "grad_norm": 93.90611267089844, - "learning_rate": 3.866403483828392e-06, - "loss": 0.3961, - "step": 42960 - }, - { - "epoch": 85.98, - "grad_norm": 85.02204132080078, - "learning_rate": 3.860284808438962e-06, - "loss": 0.4093, - "step": 42990 - }, - { - "epoch": 86.0, - "eval_loss": 0.3298526406288147, - "eval_map": 0.7711, - "eval_map_50": 0.9535, - "eval_map_75": 0.8948, - "eval_map_chicken": 0.7478, - "eval_map_duck": 0.7176, - "eval_map_large": 0.8096, - "eval_map_medium": 0.7678, - "eval_map_plant": 0.8478, - "eval_map_small": 0.2808, - "eval_mar_1": 0.31, - "eval_mar_10": 0.8091, - "eval_mar_100": 0.8156, - "eval_mar_100_chicken": 0.7996, - "eval_mar_100_duck": 0.7629, - "eval_mar_100_plant": 0.8842, - "eval_mar_large": 0.8489, - "eval_mar_medium": 0.8098, - "eval_mar_small": 0.3848, - "eval_runtime": 13.2107, - "eval_samples_per_second": 7.57, - "eval_steps_per_second": 0.984, - "step": 43000 - }, - { - "epoch": 86.04, - "grad_norm": 73.50428771972656, - "learning_rate": 3.854167932815387e-06, - "loss": 0.3526, - "step": 43020 - }, - { - "epoch": 86.1, - "grad_norm": 56.092628479003906, - "learning_rate": 3.8480528666170495e-06, - "loss": 0.3843, - "step": 43050 - }, - { - "epoch": 86.16, - "grad_norm": 59.24781036376953, - "learning_rate": 3.841939619500468e-06, - "loss": 0.4454, - "step": 43080 - }, - { - "epoch": 86.22, - "grad_norm": 52.54795455932617, - "learning_rate": 3.835828201119302e-06, - "loss": 0.3502, - "step": 43110 - }, - { - "epoch": 86.28, - "grad_norm": 46.815635681152344, - "learning_rate": 3.8297186211243085e-06, - "loss": 0.4507, - "step": 43140 - }, - { - "epoch": 86.34, - "grad_norm": 32.43108367919922, - "learning_rate": 3.823610889163354e-06, - "loss": 0.4188, - "step": 43170 - }, - { - "epoch": 86.4, - "grad_norm": 52.47710037231445, - "learning_rate": 3.817505014881378e-06, - "loss": 0.3677, - "step": 43200 - }, - { - "epoch": 86.46, - "grad_norm": 69.88518524169922, - "learning_rate": 3.8114010079203877e-06, - "loss": 0.4521, - "step": 43230 - }, - { - "epoch": 86.52, - "grad_norm": 44.97297668457031, - "learning_rate": 3.8052988779194478e-06, - "loss": 0.4146, - "step": 43260 - }, - { - "epoch": 86.58, - "grad_norm": 54.33777618408203, - "learning_rate": 3.7991986345146503e-06, - "loss": 0.4564, - "step": 43290 - }, - { - "epoch": 86.64, - "grad_norm": 60.42967987060547, - "learning_rate": 3.7931002873391156e-06, - "loss": 0.4434, - "step": 43320 - }, - { - "epoch": 86.7, - "grad_norm": 39.14558792114258, - "learning_rate": 3.787003846022964e-06, - "loss": 0.3712, - "step": 43350 - }, - { - "epoch": 86.76, - "grad_norm": 40.65776062011719, - "learning_rate": 3.7809093201933078e-06, - "loss": 0.3638, - "step": 43380 - }, - { - "epoch": 86.82, - "grad_norm": 41.96371841430664, - "learning_rate": 3.774816719474238e-06, - "loss": 0.4215, - "step": 43410 - }, - { - "epoch": 86.88, - "grad_norm": 29.773893356323242, - "learning_rate": 3.7687260534868e-06, - "loss": 0.3284, - "step": 43440 - }, - { - "epoch": 86.94, - "grad_norm": 29.671260833740234, - "learning_rate": 3.762637331848989e-06, - "loss": 0.4451, - "step": 43470 - }, - { - "epoch": 87.0, - "grad_norm": 109.13446044921875, - "learning_rate": 3.756550564175727e-06, - "loss": 0.447, - "step": 43500 - }, - { - "epoch": 87.0, - "eval_loss": 0.3273865878582001, - "eval_map": 0.7718, - "eval_map_50": 0.9547, - "eval_map_75": 0.8992, - "eval_map_chicken": 0.7686, - "eval_map_duck": 0.7125, - "eval_map_large": 0.8004, - "eval_map_medium": 0.7699, - "eval_map_plant": 0.8343, - "eval_map_small": 0.2794, - "eval_mar_1": 0.3086, - "eval_mar_10": 0.8129, - "eval_mar_100": 0.8177, - "eval_mar_100_chicken": 0.8151, - "eval_mar_100_duck": 0.7639, - "eval_mar_100_plant": 0.8742, - "eval_mar_large": 0.8445, - "eval_mar_medium": 0.8106, - "eval_mar_small": 0.3738, - "eval_runtime": 14.4819, - "eval_samples_per_second": 6.905, - "eval_steps_per_second": 0.898, - "step": 43500 - }, - { - "epoch": 87.06, - "grad_norm": 48.34268569946289, - "learning_rate": 3.7504657600788484e-06, - "loss": 0.3533, - "step": 43530 - }, - { - "epoch": 87.12, - "grad_norm": 93.21697998046875, - "learning_rate": 3.744382929167094e-06, - "loss": 0.4566, - "step": 43560 - }, - { - "epoch": 87.18, - "grad_norm": 75.50614929199219, - "learning_rate": 3.73830208104608e-06, - "loss": 0.4309, - "step": 43590 - }, - { - "epoch": 87.24, - "grad_norm": 0.00020948913879692554, - "learning_rate": 3.7322232253182984e-06, - "loss": 0.3898, - "step": 43620 - }, - { - "epoch": 87.3, - "grad_norm": 95.0788803100586, - "learning_rate": 3.7261463715830902e-06, - "loss": 0.3298, - "step": 43650 - }, - { - "epoch": 87.36, - "grad_norm": 193.90707397460938, - "learning_rate": 3.7200715294366376e-06, - "loss": 0.4115, - "step": 43680 - }, - { - "epoch": 87.42, - "grad_norm": 78.2755355834961, - "learning_rate": 3.7139987084719463e-06, - "loss": 0.4018, - "step": 43710 - }, - { - "epoch": 87.48, - "grad_norm": 60.400638580322266, - "learning_rate": 3.7079279182788263e-06, - "loss": 0.3891, - "step": 43740 - }, - { - "epoch": 87.54, - "grad_norm": 38.12732696533203, - "learning_rate": 3.70185916844389e-06, - "loss": 0.3482, - "step": 43770 - }, - { - "epoch": 87.6, - "grad_norm": 48.90447235107422, - "learning_rate": 3.695792468550517e-06, - "loss": 0.4548, - "step": 43800 - }, - { - "epoch": 87.66, - "grad_norm": 45.640445709228516, - "learning_rate": 3.689727828178854e-06, - "loss": 0.3963, - "step": 43830 - }, - { - "epoch": 87.72, - "grad_norm": 26.108816146850586, - "learning_rate": 3.6836652569057994e-06, - "loss": 0.3491, - "step": 43860 - }, - { - "epoch": 87.78, - "grad_norm": 104.40931701660156, - "learning_rate": 3.6776047643049777e-06, - "loss": 0.4184, - "step": 43890 - }, - { - "epoch": 87.84, - "grad_norm": 49.7859992980957, - "learning_rate": 3.6715463599467372e-06, - "loss": 0.4433, - "step": 43920 - }, - { - "epoch": 87.9, - "grad_norm": 63.1917839050293, - "learning_rate": 3.6654900533981234e-06, - "loss": 0.4859, - "step": 43950 - }, - { - "epoch": 87.96, - "grad_norm": 125.78496551513672, - "learning_rate": 3.659435854222869e-06, - "loss": 0.3878, - "step": 43980 - }, - { - "epoch": 88.0, - "eval_loss": 0.3161975145339966, - "eval_map": 0.7836, - "eval_map_50": 0.9558, - "eval_map_75": 0.9025, - "eval_map_chicken": 0.7758, - "eval_map_duck": 0.7307, - "eval_map_large": 0.8195, - "eval_map_medium": 0.7785, - "eval_map_plant": 0.8442, - "eval_map_small": 0.2726, - "eval_mar_1": 0.3138, - "eval_mar_10": 0.8202, - "eval_mar_100": 0.8262, - "eval_mar_100_chicken": 0.8206, - "eval_mar_100_duck": 0.7763, - "eval_mar_100_plant": 0.8818, - "eval_mar_large": 0.8567, - "eval_mar_medium": 0.8201, - "eval_mar_small": 0.3805, - "eval_runtime": 12.578, - "eval_samples_per_second": 7.95, - "eval_steps_per_second": 1.034, - "step": 44000 - }, - { - "epoch": 88.02, - "grad_norm": 103.24290466308594, - "learning_rate": 3.653383771981385e-06, - "loss": 0.4455, - "step": 44010 - }, - { - "epoch": 88.08, - "grad_norm": 84.60028839111328, - "learning_rate": 3.6473338162307314e-06, - "loss": 0.434, - "step": 44040 - }, - { - "epoch": 88.14, - "grad_norm": 44.8115234375, - "learning_rate": 3.6412859965246173e-06, - "loss": 0.3777, - "step": 44070 - }, - { - "epoch": 88.2, - "grad_norm": 71.17977142333984, - "learning_rate": 3.635240322413375e-06, - "loss": 0.4282, - "step": 44100 - }, - { - "epoch": 88.26, - "grad_norm": 80.82675170898438, - "learning_rate": 3.6291968034439463e-06, - "loss": 0.3941, - "step": 44130 - }, - { - "epoch": 88.32, - "grad_norm": 59.04813003540039, - "learning_rate": 3.6231554491598766e-06, - "loss": 0.3542, - "step": 44160 - }, - { - "epoch": 88.38, - "grad_norm": 97.56294250488281, - "learning_rate": 3.617116269101286e-06, - "loss": 0.3248, - "step": 44190 - }, - { - "epoch": 88.44, - "grad_norm": 42.90022659301758, - "learning_rate": 3.6110792728048636e-06, - "loss": 0.4781, - "step": 44220 - }, - { - "epoch": 88.5, - "grad_norm": 55.824066162109375, - "learning_rate": 3.6050444698038547e-06, - "loss": 0.3814, - "step": 44250 - }, - { - "epoch": 88.56, - "grad_norm": 0.0001099341970984824, - "learning_rate": 3.599011869628033e-06, - "loss": 0.4042, - "step": 44280 - }, - { - "epoch": 88.62, - "grad_norm": 84.20889282226562, - "learning_rate": 3.592981481803699e-06, - "loss": 0.3713, - "step": 44310 - }, - { - "epoch": 88.68, - "grad_norm": 94.83952331542969, - "learning_rate": 3.5869533158536583e-06, - "loss": 0.3942, - "step": 44340 - }, - { - "epoch": 88.74, - "grad_norm": 79.83787536621094, - "learning_rate": 3.5809273812972078e-06, - "loss": 0.4026, - "step": 44370 - }, - { - "epoch": 88.8, - "grad_norm": 51.58283233642578, - "learning_rate": 3.5749036876501196e-06, - "loss": 0.3962, - "step": 44400 - }, - { - "epoch": 88.86, - "grad_norm": 77.16682434082031, - "learning_rate": 3.5688822444246297e-06, - "loss": 0.4762, - "step": 44430 - }, - { - "epoch": 88.92, - "grad_norm": 45.30950927734375, - "learning_rate": 3.562863061129419e-06, - "loss": 0.4095, - "step": 44460 - }, - { - "epoch": 88.98, - "grad_norm": 31.94639015197754, - "learning_rate": 3.556846147269598e-06, - "loss": 0.3293, - "step": 44490 - }, - { - "epoch": 89.0, - "eval_loss": 0.3279344439506531, - "eval_map": 0.7753, - "eval_map_50": 0.9585, - "eval_map_75": 0.8908, - "eval_map_chicken": 0.76, - "eval_map_duck": 0.7257, - "eval_map_large": 0.8023, - "eval_map_medium": 0.7729, - "eval_map_plant": 0.8403, - "eval_map_small": 0.2607, - "eval_mar_1": 0.3112, - "eval_mar_10": 0.8129, - "eval_mar_100": 0.8193, - "eval_mar_100_chicken": 0.8095, - "eval_mar_100_duck": 0.7732, - "eval_mar_100_plant": 0.8752, - "eval_mar_large": 0.8371, - "eval_mar_medium": 0.8182, - "eval_mar_small": 0.3748, - "eval_runtime": 17.7473, - "eval_samples_per_second": 5.635, - "eval_steps_per_second": 0.733, - "step": 44500 - }, - { - "epoch": 89.04, - "grad_norm": 36.628517150878906, - "learning_rate": 3.550831512346695e-06, - "loss": 0.3556, - "step": 44520 - }, - { - "epoch": 89.1, - "grad_norm": 99.59779357910156, - "learning_rate": 3.5448191658586423e-06, - "loss": 0.4123, - "step": 44550 - }, - { - "epoch": 89.16, - "grad_norm": 34.27329635620117, - "learning_rate": 3.538809117299751e-06, - "loss": 0.5333, - "step": 44580 - }, - { - "epoch": 89.22, - "grad_norm": 43.351253509521484, - "learning_rate": 3.532801376160713e-06, - "loss": 0.3547, - "step": 44610 - }, - { - "epoch": 89.28, - "grad_norm": 87.09569549560547, - "learning_rate": 3.526795951928569e-06, - "loss": 0.4303, - "step": 44640 - }, - { - "epoch": 89.34, - "grad_norm": 40.55412673950195, - "learning_rate": 3.520792854086702e-06, - "loss": 0.4896, - "step": 44670 - }, - { - "epoch": 89.4, - "grad_norm": 0.00017987802857533097, - "learning_rate": 3.5147920921148267e-06, - "loss": 0.3599, - "step": 44700 - }, - { - "epoch": 89.46, - "grad_norm": 113.14846801757812, - "learning_rate": 3.5087936754889614e-06, - "loss": 0.4684, - "step": 44730 - }, - { - "epoch": 89.52, - "grad_norm": 44.751216888427734, - "learning_rate": 3.502797613681429e-06, - "loss": 0.375, - "step": 44760 - }, - { - "epoch": 89.58, - "grad_norm": 60.96277618408203, - "learning_rate": 3.496803916160827e-06, - "loss": 0.3559, - "step": 44790 - }, - { - "epoch": 89.64, - "grad_norm": 53.7309684753418, - "learning_rate": 3.4908125923920204e-06, - "loss": 0.3498, - "step": 44820 - }, - { - "epoch": 89.7, - "grad_norm": 51.482662200927734, - "learning_rate": 3.484823651836131e-06, - "loss": 0.4061, - "step": 44850 - }, - { - "epoch": 89.76, - "grad_norm": 139.41561889648438, - "learning_rate": 3.478837103950509e-06, - "loss": 0.3898, - "step": 44880 - }, - { - "epoch": 89.82, - "grad_norm": 35.693016052246094, - "learning_rate": 3.472852958188736e-06, - "loss": 0.3961, - "step": 44910 - }, - { - "epoch": 89.88, - "grad_norm": 29.292320251464844, - "learning_rate": 3.4668712240005912e-06, - "loss": 0.4392, - "step": 44940 - }, - { - "epoch": 89.94, - "grad_norm": 63.4970817565918, - "learning_rate": 3.4608919108320488e-06, - "loss": 0.4191, - "step": 44970 - }, - { - "epoch": 90.0, - "grad_norm": 130.6688995361328, - "learning_rate": 3.4549150281252635e-06, - "loss": 0.279, - "step": 45000 - }, - { - "epoch": 90.0, - "eval_loss": 0.3147023320198059, - "eval_map": 0.7774, - "eval_map_50": 0.9502, - "eval_map_75": 0.8862, - "eval_map_chicken": 0.7737, - "eval_map_duck": 0.7143, - "eval_map_large": 0.8075, - "eval_map_medium": 0.7753, - "eval_map_plant": 0.8442, - "eval_map_small": 0.2608, - "eval_mar_1": 0.3091, - "eval_mar_10": 0.8166, - "eval_mar_100": 0.8217, - "eval_mar_100_chicken": 0.821, - "eval_mar_100_duck": 0.7608, - "eval_mar_100_plant": 0.8833, - "eval_mar_large": 0.8512, - "eval_mar_medium": 0.8164, - "eval_mar_small": 0.351, - "eval_runtime": 13.2431, - "eval_samples_per_second": 7.551, - "eval_steps_per_second": 0.982, - "step": 45000 - }, - { - "epoch": 90.06, - "grad_norm": 31.652523040771484, - "learning_rate": 3.4489405853185465e-06, - "loss": 0.4461, - "step": 45030 - }, - { - "epoch": 90.12, - "grad_norm": 54.40607452392578, - "learning_rate": 3.442968591846359e-06, - "loss": 0.3232, - "step": 45060 - }, - { - "epoch": 90.18, - "grad_norm": 22.42218589782715, - "learning_rate": 3.436999057139295e-06, - "loss": 0.3202, - "step": 45090 - }, - { - "epoch": 90.24, - "grad_norm": 403.88385009765625, - "learning_rate": 3.431031990624063e-06, - "loss": 0.4488, - "step": 45120 - }, - { - "epoch": 90.3, - "grad_norm": 31.73854637145996, - "learning_rate": 3.4250674017234774e-06, - "loss": 0.2749, - "step": 45150 - }, - { - "epoch": 90.36, - "grad_norm": 86.20687103271484, - "learning_rate": 3.4191052998564344e-06, - "loss": 0.3923, - "step": 45180 - }, - { - "epoch": 90.42, - "grad_norm": 156.41319274902344, - "learning_rate": 3.4131456944379126e-06, - "loss": 0.4246, - "step": 45210 - }, - { - "epoch": 90.48, - "grad_norm": 345.8996276855469, - "learning_rate": 3.407188594878938e-06, - "loss": 0.3513, - "step": 45240 - }, - { - "epoch": 90.54, - "grad_norm": 72.64080047607422, - "learning_rate": 3.401234010586583e-06, - "loss": 0.3544, - "step": 45270 - }, - { - "epoch": 90.6, - "grad_norm": 53.70094299316406, - "learning_rate": 3.3952819509639534e-06, - "loss": 0.3916, - "step": 45300 - }, - { - "epoch": 90.66, - "grad_norm": 36.67252731323242, - "learning_rate": 3.38933242541016e-06, - "loss": 0.3854, - "step": 45330 - }, - { - "epoch": 90.72, - "grad_norm": 60.829288482666016, - "learning_rate": 3.3833854433203185e-06, - "loss": 0.3689, - "step": 45360 - }, - { - "epoch": 90.78, - "grad_norm": 38.895896911621094, - "learning_rate": 3.377441014085524e-06, - "loss": 0.4459, - "step": 45390 - }, - { - "epoch": 90.84, - "grad_norm": 121.845947265625, - "learning_rate": 3.3714991470928393e-06, - "loss": 0.4464, - "step": 45420 - }, - { - "epoch": 90.9, - "grad_norm": 167.4103240966797, - "learning_rate": 3.3655598517252886e-06, - "loss": 0.4413, - "step": 45450 - }, - { - "epoch": 90.96, - "grad_norm": 34.13265609741211, - "learning_rate": 3.359623137361825e-06, - "loss": 0.339, - "step": 45480 - }, - { - "epoch": 91.0, - "eval_loss": 0.31199073791503906, - "eval_map": 0.7779, - "eval_map_50": 0.9532, - "eval_map_75": 0.8949, - "eval_map_chicken": 0.7784, - "eval_map_duck": 0.7125, - "eval_map_large": 0.8047, - "eval_map_medium": 0.7732, - "eval_map_plant": 0.8428, - "eval_map_small": 0.2683, - "eval_mar_1": 0.3094, - "eval_mar_10": 0.8169, - "eval_mar_100": 0.8225, - "eval_mar_100_chicken": 0.8262, - "eval_mar_100_duck": 0.7598, - "eval_mar_100_plant": 0.8815, - "eval_mar_large": 0.8504, - "eval_mar_medium": 0.8181, - "eval_mar_small": 0.3881, - "eval_runtime": 14.2049, - "eval_samples_per_second": 7.04, - "eval_steps_per_second": 0.915, - "step": 45500 - }, - { - "epoch": 91.02, - "grad_norm": 49.64610290527344, - "learning_rate": 3.3536890133773346e-06, - "loss": 0.3835, - "step": 45510 - }, - { - "epoch": 91.08, - "grad_norm": 44.39104080200195, - "learning_rate": 3.347757489142608e-06, - "loss": 0.4032, - "step": 45540 - }, - { - "epoch": 91.14, - "grad_norm": 108.25508880615234, - "learning_rate": 3.3418285740243285e-06, - "loss": 0.3498, - "step": 45570 - }, - { - "epoch": 91.2, - "grad_norm": 81.07303619384766, - "learning_rate": 3.3359022773850673e-06, - "loss": 0.3952, - "step": 45600 - }, - { - "epoch": 91.26, - "grad_norm": 55.850730895996094, - "learning_rate": 3.329978608583252e-06, - "loss": 0.4522, - "step": 45630 - }, - { - "epoch": 91.32, - "grad_norm": 60.0030632019043, - "learning_rate": 3.3240575769731662e-06, - "loss": 0.3706, - "step": 45660 - }, - { - "epoch": 91.38, - "grad_norm": 110.41849517822266, - "learning_rate": 3.3181391919049277e-06, - "loss": 0.434, - "step": 45690 - }, - { - "epoch": 91.44, - "grad_norm": 0.00027178472373634577, - "learning_rate": 3.312223462724472e-06, - "loss": 0.4455, - "step": 45720 - }, - { - "epoch": 91.5, - "grad_norm": 0.0003708788426592946, - "learning_rate": 3.3063103987735433e-06, - "loss": 0.3994, - "step": 45750 - }, - { - "epoch": 91.56, - "grad_norm": 34.135887145996094, - "learning_rate": 3.300400009389678e-06, - "loss": 0.5321, - "step": 45780 - }, - { - "epoch": 91.62, - "grad_norm": 190.13998413085938, - "learning_rate": 3.294492303906188e-06, - "loss": 0.3533, - "step": 45810 - }, - { - "epoch": 91.68, - "grad_norm": 44.5889892578125, - "learning_rate": 3.2885872916521445e-06, - "loss": 0.3205, - "step": 45840 - }, - { - "epoch": 91.74, - "grad_norm": 46.73158264160156, - "learning_rate": 3.282684981952369e-06, - "loss": 0.3406, - "step": 45870 - }, - { - "epoch": 91.8, - "grad_norm": 66.26206970214844, - "learning_rate": 3.2767853841274154e-06, - "loss": 0.3789, - "step": 45900 - }, - { - "epoch": 91.86, - "grad_norm": 108.49457550048828, - "learning_rate": 3.2708885074935515e-06, - "loss": 0.3897, - "step": 45930 - }, - { - "epoch": 91.92, - "grad_norm": 39.29719161987305, - "learning_rate": 3.264994361362753e-06, - "loss": 0.3295, - "step": 45960 - }, - { - "epoch": 91.98, - "grad_norm": 101.66162109375, - "learning_rate": 3.25910295504268e-06, - "loss": 0.3912, - "step": 45990 - }, - { - "epoch": 92.0, - "eval_loss": 0.32507237792015076, - "eval_map": 0.7654, - "eval_map_50": 0.9549, - "eval_map_75": 0.9026, - "eval_map_chicken": 0.7566, - "eval_map_duck": 0.7011, - "eval_map_large": 0.7949, - "eval_map_medium": 0.7613, - "eval_map_plant": 0.8385, - "eval_map_small": 0.239, - "eval_mar_1": 0.3052, - "eval_mar_10": 0.8083, - "eval_mar_100": 0.8145, - "eval_mar_100_chicken": 0.8115, - "eval_mar_100_duck": 0.7536, - "eval_mar_100_plant": 0.8785, - "eval_mar_large": 0.8352, - "eval_mar_medium": 0.81, - "eval_mar_small": 0.4105, - "eval_runtime": 12.6537, - "eval_samples_per_second": 7.903, - "eval_steps_per_second": 1.027, - "step": 46000 - }, - { - "epoch": 92.04, - "grad_norm": 44.84565734863281, - "learning_rate": 3.2532142978366654e-06, - "loss": 0.3629, - "step": 46020 - }, - { - "epoch": 92.1, - "grad_norm": 49.798702239990234, - "learning_rate": 3.247328399043706e-06, - "loss": 0.4384, - "step": 46050 - }, - { - "epoch": 92.16, - "grad_norm": 109.70671081542969, - "learning_rate": 3.241445267958438e-06, - "loss": 0.485, - "step": 46080 - }, - { - "epoch": 92.22, - "grad_norm": 39.21620559692383, - "learning_rate": 3.235564913871126e-06, - "loss": 0.3781, - "step": 46110 - }, - { - "epoch": 92.28, - "grad_norm": 134.4602508544922, - "learning_rate": 3.2296873460676557e-06, - "loss": 0.3406, - "step": 46140 - }, - { - "epoch": 92.34, - "grad_norm": 75.78138732910156, - "learning_rate": 3.2238125738295063e-06, - "loss": 0.3853, - "step": 46170 - }, - { - "epoch": 92.4, - "grad_norm": 223.64117431640625, - "learning_rate": 3.217940606433747e-06, - "loss": 0.363, - "step": 46200 - }, - { - "epoch": 92.46, - "grad_norm": 58.8635139465332, - "learning_rate": 3.212071453153015e-06, - "loss": 0.4155, - "step": 46230 - }, - { - "epoch": 92.52, - "grad_norm": 51.66313552856445, - "learning_rate": 3.2062051232555024e-06, - "loss": 0.3064, - "step": 46260 - }, - { - "epoch": 92.58, - "grad_norm": 37.06298065185547, - "learning_rate": 3.2003416260049493e-06, - "loss": 0.3651, - "step": 46290 - }, - { - "epoch": 92.64, - "grad_norm": 45.798763275146484, - "learning_rate": 3.1944809706606123e-06, - "loss": 0.501, - "step": 46320 - }, - { - "epoch": 92.7, - "grad_norm": 28.174030303955078, - "learning_rate": 3.188623166477272e-06, - "loss": 0.3911, - "step": 46350 - }, - { - "epoch": 92.76, - "grad_norm": 76.97637939453125, - "learning_rate": 3.182768222705198e-06, - "loss": 0.4013, - "step": 46380 - }, - { - "epoch": 92.82, - "grad_norm": 428.0056457519531, - "learning_rate": 3.1769161485901445e-06, - "loss": 0.3675, - "step": 46410 - }, - { - "epoch": 92.88, - "grad_norm": 51.109649658203125, - "learning_rate": 3.171066953373338e-06, - "loss": 0.4192, - "step": 46440 - }, - { - "epoch": 92.94, - "grad_norm": 8.084972068900242e-05, - "learning_rate": 3.1652206462914542e-06, - "loss": 0.2879, - "step": 46470 - }, - { - "epoch": 93.0, - "grad_norm": 68.58462524414062, - "learning_rate": 3.1593772365766107e-06, - "loss": 0.3807, - "step": 46500 - }, - { - "epoch": 93.0, - "eval_loss": 0.3134855329990387, - "eval_map": 0.775, - "eval_map_50": 0.9623, - "eval_map_75": 0.8789, - "eval_map_chicken": 0.7674, - "eval_map_duck": 0.7131, - "eval_map_large": 0.8012, - "eval_map_medium": 0.7761, - "eval_map_plant": 0.8444, - "eval_map_small": 0.3063, - "eval_mar_1": 0.3088, - "eval_mar_10": 0.8154, - "eval_mar_100": 0.822, - "eval_mar_100_chicken": 0.821, - "eval_mar_100_duck": 0.7608, - "eval_mar_100_plant": 0.8842, - "eval_mar_large": 0.845, - "eval_mar_medium": 0.8208, - "eval_mar_small": 0.4376, - "eval_runtime": 13.363, - "eval_samples_per_second": 7.483, - "eval_steps_per_second": 0.973, - "step": 46500 - }, - { - "epoch": 93.06, - "grad_norm": 171.59226989746094, - "learning_rate": 3.1535367334563493e-06, - "loss": 0.3706, - "step": 46530 - }, - { - "epoch": 93.12, - "grad_norm": 45.086509704589844, - "learning_rate": 3.147699146153621e-06, - "loss": 0.3423, - "step": 46560 - }, - { - "epoch": 93.18, - "grad_norm": 71.19178009033203, - "learning_rate": 3.141864483886774e-06, - "loss": 0.4562, - "step": 46590 - }, - { - "epoch": 93.24, - "grad_norm": 66.43144989013672, - "learning_rate": 3.1360327558695336e-06, - "loss": 0.3422, - "step": 46620 - }, - { - "epoch": 93.3, - "grad_norm": 65.01272583007812, - "learning_rate": 3.130203971310999e-06, - "loss": 0.3208, - "step": 46650 - }, - { - "epoch": 93.36, - "grad_norm": 26.024059295654297, - "learning_rate": 3.1243781394156138e-06, - "loss": 0.3998, - "step": 46680 - }, - { - "epoch": 93.42, - "grad_norm": 49.75782012939453, - "learning_rate": 3.1185552693831595e-06, - "loss": 0.3497, - "step": 46710 - }, - { - "epoch": 93.48, - "grad_norm": 41.48928451538086, - "learning_rate": 3.1127353704087477e-06, - "loss": 0.3313, - "step": 46740 - }, - { - "epoch": 93.54, - "grad_norm": 35.04191589355469, - "learning_rate": 3.106918451682789e-06, - "loss": 0.3986, - "step": 46770 - }, - { - "epoch": 93.6, - "grad_norm": 55.89842987060547, - "learning_rate": 3.1011045223909954e-06, - "loss": 0.3819, - "step": 46800 - }, - { - "epoch": 93.66, - "grad_norm": 68.73428344726562, - "learning_rate": 3.0952935917143533e-06, - "loss": 0.3833, - "step": 46830 - }, - { - "epoch": 93.72, - "grad_norm": 55.55575180053711, - "learning_rate": 3.089485668829113e-06, - "loss": 0.5715, - "step": 46860 - }, - { - "epoch": 93.78, - "grad_norm": 102.37735748291016, - "learning_rate": 3.0836807629067828e-06, - "loss": 0.3383, - "step": 46890 - }, - { - "epoch": 93.84, - "grad_norm": 157.2577667236328, - "learning_rate": 3.077878883114096e-06, - "loss": 0.3836, - "step": 46920 - }, - { - "epoch": 93.9, - "grad_norm": 38.29557418823242, - "learning_rate": 3.0720800386130176e-06, - "loss": 0.3645, - "step": 46950 - }, - { - "epoch": 93.96, - "grad_norm": 77.96990203857422, - "learning_rate": 3.066284238560713e-06, - "loss": 0.3656, - "step": 46980 - }, - { - "epoch": 94.0, - "eval_loss": 0.30864033102989197, - "eval_map": 0.7801, - "eval_map_50": 0.95, - "eval_map_75": 0.8789, - "eval_map_chicken": 0.7752, - "eval_map_duck": 0.726, - "eval_map_large": 0.8114, - "eval_map_medium": 0.7843, - "eval_map_plant": 0.8391, - "eval_map_small": 0.2709, - "eval_mar_1": 0.3144, - "eval_mar_10": 0.8184, - "eval_mar_100": 0.8227, - "eval_mar_100_chicken": 0.8238, - "eval_mar_100_duck": 0.766, - "eval_mar_100_plant": 0.8782, - "eval_mar_large": 0.8487, - "eval_mar_medium": 0.8282, - "eval_mar_small": 0.3586, - "eval_runtime": 13.7432, - "eval_samples_per_second": 7.276, - "eval_steps_per_second": 0.946, - "step": 47000 - }, - { - "epoch": 94.02, - "grad_norm": 40.90016555786133, - "learning_rate": 3.0604914921095373e-06, - "loss": 0.3862, - "step": 47010 - }, - { - "epoch": 94.08, - "grad_norm": 93.9953384399414, - "learning_rate": 3.0547018084070344e-06, - "loss": 0.4032, - "step": 47040 - }, - { - "epoch": 94.14, - "grad_norm": 52.626590728759766, - "learning_rate": 3.0489151965958998e-06, - "loss": 0.2954, - "step": 47070 - }, - { - "epoch": 94.2, - "grad_norm": 160.8077850341797, - "learning_rate": 3.043131665813988e-06, - "loss": 0.4525, - "step": 47100 - }, - { - "epoch": 94.26, - "grad_norm": 58.31721496582031, - "learning_rate": 3.0373512251942817e-06, - "loss": 0.3511, - "step": 47130 - }, - { - "epoch": 94.32, - "grad_norm": 43.910247802734375, - "learning_rate": 3.031573883864882e-06, - "loss": 0.3748, - "step": 47160 - }, - { - "epoch": 94.38, - "grad_norm": 113.1803970336914, - "learning_rate": 3.025799650949006e-06, - "loss": 0.3322, - "step": 47190 - }, - { - "epoch": 94.44, - "grad_norm": 168.05003356933594, - "learning_rate": 3.0200285355649504e-06, - "loss": 0.3997, - "step": 47220 - }, - { - "epoch": 94.5, - "grad_norm": 125.55654907226562, - "learning_rate": 3.0142605468260976e-06, - "loss": 0.4203, - "step": 47250 - }, - { - "epoch": 94.56, - "grad_norm": 64.3763427734375, - "learning_rate": 3.0084956938408873e-06, - "loss": 0.3918, - "step": 47280 - }, - { - "epoch": 94.62, - "grad_norm": 71.17652893066406, - "learning_rate": 3.002733985712808e-06, - "loss": 0.3435, - "step": 47310 - }, - { - "epoch": 94.68, - "grad_norm": 56.69123840332031, - "learning_rate": 2.9969754315403865e-06, - "loss": 0.4095, - "step": 47340 - }, - { - "epoch": 94.74, - "grad_norm": 49.36955261230469, - "learning_rate": 2.991220040417162e-06, - "loss": 0.3498, - "step": 47370 - }, - { - "epoch": 94.8, - "grad_norm": 8.323022484546527e-05, - "learning_rate": 2.9854678214316875e-06, - "loss": 0.3168, - "step": 47400 - }, - { - "epoch": 94.86, - "grad_norm": 96.6518325805664, - "learning_rate": 2.979718783667499e-06, - "loss": 0.4719, - "step": 47430 - }, - { - "epoch": 94.92, - "grad_norm": 39.4531364440918, - "learning_rate": 2.97397293620311e-06, - "loss": 0.3919, - "step": 47460 - }, - { - "epoch": 94.98, - "grad_norm": 50.0933837890625, - "learning_rate": 2.968230288112002e-06, - "loss": 0.4247, - "step": 47490 - }, - { - "epoch": 95.0, - "eval_loss": 0.31141915917396545, - "eval_map": 0.7796, - "eval_map_50": 0.9586, - "eval_map_75": 0.8881, - "eval_map_chicken": 0.7644, - "eval_map_duck": 0.7272, - "eval_map_large": 0.7972, - "eval_map_medium": 0.7744, - "eval_map_plant": 0.8473, - "eval_map_small": 0.3308, - "eval_mar_1": 0.3095, - "eval_mar_10": 0.8172, - "eval_mar_100": 0.8224, - "eval_mar_100_chicken": 0.8135, - "eval_mar_100_duck": 0.7701, - "eval_mar_100_plant": 0.8836, - "eval_mar_large": 0.8408, - "eval_mar_medium": 0.8143, - "eval_mar_small": 0.4505, - "eval_runtime": 13.2979, - "eval_samples_per_second": 7.52, - "eval_steps_per_second": 0.978, - "step": 47500 - }, - { - "epoch": 95.04, - "grad_norm": 17.76614761352539, - "learning_rate": 2.962490848462596e-06, - "loss": 0.2925, - "step": 47520 - }, - { - "epoch": 95.1, - "grad_norm": 68.24947357177734, - "learning_rate": 2.9567546263182554e-06, - "loss": 0.3557, - "step": 47550 - }, - { - "epoch": 95.16, - "grad_norm": 30.662485122680664, - "learning_rate": 2.951021630737255e-06, - "loss": 0.3694, - "step": 47580 - }, - { - "epoch": 95.22, - "grad_norm": 31.896482467651367, - "learning_rate": 2.945291870772776e-06, - "loss": 0.5909, - "step": 47610 - }, - { - "epoch": 95.28, - "grad_norm": 43.45343017578125, - "learning_rate": 2.9395653554728955e-06, - "loss": 0.3929, - "step": 47640 - }, - { - "epoch": 95.34, - "grad_norm": 49.6175537109375, - "learning_rate": 2.933842093880558e-06, - "loss": 0.4409, - "step": 47670 - }, - { - "epoch": 95.4, - "grad_norm": 34.212284088134766, - "learning_rate": 2.92812209503358e-06, - "loss": 0.3825, - "step": 47700 - }, - { - "epoch": 95.46, - "grad_norm": 45.17938232421875, - "learning_rate": 2.922405367964617e-06, - "loss": 0.347, - "step": 47730 - }, - { - "epoch": 95.52, - "grad_norm": 73.44324493408203, - "learning_rate": 2.91669192170116e-06, - "loss": 0.2972, - "step": 47760 - }, - { - "epoch": 95.58, - "grad_norm": 296.8179931640625, - "learning_rate": 2.9109817652655253e-06, - "loss": 0.401, - "step": 47790 - }, - { - "epoch": 95.64, - "grad_norm": 59.57863235473633, - "learning_rate": 2.9052749076748266e-06, - "loss": 0.4201, - "step": 47820 - }, - { - "epoch": 95.7, - "grad_norm": 79.73772430419922, - "learning_rate": 2.899571357940969e-06, - "loss": 0.3687, - "step": 47850 - }, - { - "epoch": 95.76, - "grad_norm": 78.04991912841797, - "learning_rate": 2.8938711250706397e-06, - "loss": 0.399, - "step": 47880 - }, - { - "epoch": 95.82, - "grad_norm": 138.978515625, - "learning_rate": 2.8881742180652813e-06, - "loss": 0.4855, - "step": 47910 - }, - { - "epoch": 95.88, - "grad_norm": 73.97747802734375, - "learning_rate": 2.8824806459210907e-06, - "loss": 0.3487, - "step": 47940 - }, - { - "epoch": 95.94, - "grad_norm": 44.751983642578125, - "learning_rate": 2.876790417628994e-06, - "loss": 0.327, - "step": 47970 - }, - { - "epoch": 96.0, - "grad_norm": 63.331268310546875, - "learning_rate": 2.871103542174637e-06, - "loss": 0.4126, - "step": 48000 - }, - { - "epoch": 96.0, - "eval_loss": 0.31334859132766724, - "eval_map": 0.7738, - "eval_map_50": 0.9614, - "eval_map_75": 0.8988, - "eval_map_chicken": 0.7608, - "eval_map_duck": 0.7137, - "eval_map_large": 0.8021, - "eval_map_medium": 0.7708, - "eval_map_plant": 0.8468, - "eval_map_small": 0.3127, - "eval_mar_1": 0.31, - "eval_mar_10": 0.8124, - "eval_mar_100": 0.8185, - "eval_mar_100_chicken": 0.8087, - "eval_mar_100_duck": 0.7629, - "eval_mar_100_plant": 0.8839, - "eval_mar_large": 0.842, - "eval_mar_medium": 0.8166, - "eval_mar_small": 0.3962, - "eval_runtime": 12.9212, - "eval_samples_per_second": 7.739, - "eval_steps_per_second": 1.006, - "step": 48000 - }, - { - "epoch": 96.06, - "grad_norm": 186.40716552734375, - "learning_rate": 2.865420028538375e-06, - "loss": 0.4059, - "step": 48030 - }, - { - "epoch": 96.12, - "grad_norm": 0.00018756429199129343, - "learning_rate": 2.8597398856952473e-06, - "loss": 0.3349, - "step": 48060 - }, - { - "epoch": 96.18, - "grad_norm": 90.84541320800781, - "learning_rate": 2.8540631226149813e-06, - "loss": 0.3498, - "step": 48090 - }, - { - "epoch": 96.24, - "grad_norm": 58.350582122802734, - "learning_rate": 2.8483897482619566e-06, - "loss": 0.4473, - "step": 48120 - }, - { - "epoch": 96.3, - "grad_norm": 31.49554443359375, - "learning_rate": 2.8427197715952047e-06, - "loss": 0.3953, - "step": 48150 - }, - { - "epoch": 96.36, - "grad_norm": 61.373722076416016, - "learning_rate": 2.837053201568396e-06, - "loss": 0.409, - "step": 48180 - }, - { - "epoch": 96.42, - "grad_norm": 66.46263885498047, - "learning_rate": 2.831390047129815e-06, - "loss": 0.3796, - "step": 48210 - }, - { - "epoch": 96.48, - "grad_norm": 53.44883728027344, - "learning_rate": 2.825730317222358e-06, - "loss": 0.4266, - "step": 48240 - }, - { - "epoch": 96.54, - "grad_norm": 73.42400360107422, - "learning_rate": 2.820074020783511e-06, - "loss": 0.396, - "step": 48270 - }, - { - "epoch": 96.6, - "grad_norm": 37.24607849121094, - "learning_rate": 2.814421166745337e-06, - "loss": 0.335, - "step": 48300 - }, - { - "epoch": 96.66, - "grad_norm": 89.07501220703125, - "learning_rate": 2.808771764034462e-06, - "loss": 0.4008, - "step": 48330 - }, - { - "epoch": 96.72, - "grad_norm": 51.42045211791992, - "learning_rate": 2.803125821572068e-06, - "loss": 0.4745, - "step": 48360 - }, - { - "epoch": 96.78, - "grad_norm": 133.7329864501953, - "learning_rate": 2.7974833482738674e-06, - "loss": 0.4058, - "step": 48390 - }, - { - "epoch": 96.84, - "grad_norm": 48.37213897705078, - "learning_rate": 2.791844353050094e-06, - "loss": 0.3529, - "step": 48420 - }, - { - "epoch": 96.9, - "grad_norm": 72.90308380126953, - "learning_rate": 2.7862088448054936e-06, - "loss": 0.3712, - "step": 48450 - }, - { - "epoch": 96.96, - "grad_norm": 29.49749183654785, - "learning_rate": 2.7805768324393017e-06, - "loss": 0.359, - "step": 48480 - }, - { - "epoch": 97.0, - "eval_loss": 0.32005390524864197, - "eval_map": 0.7733, - "eval_map_50": 0.953, - "eval_map_75": 0.906, - "eval_map_chicken": 0.7506, - "eval_map_duck": 0.7168, - "eval_map_large": 0.8001, - "eval_map_medium": 0.7727, - "eval_map_plant": 0.8526, - "eval_map_small": 0.3088, - "eval_mar_1": 0.3107, - "eval_mar_10": 0.81, - "eval_mar_100": 0.8155, - "eval_mar_100_chicken": 0.7964, - "eval_mar_100_duck": 0.7629, - "eval_mar_100_plant": 0.8873, - "eval_mar_large": 0.8409, - "eval_mar_medium": 0.8137, - "eval_mar_small": 0.391, - "eval_runtime": 14.4958, - "eval_samples_per_second": 6.899, - "eval_steps_per_second": 0.897, - "step": 48500 - }, - { - "epoch": 97.02, - "grad_norm": 60.98162078857422, - "learning_rate": 2.7749483248452324e-06, - "loss": 0.3565, - "step": 48510 - }, - { - "epoch": 97.08, - "grad_norm": 46.7698860168457, - "learning_rate": 2.769323330911472e-06, - "loss": 0.4409, - "step": 48540 - }, - { - "epoch": 97.14, - "grad_norm": 88.60187530517578, - "learning_rate": 2.763701859520652e-06, - "loss": 0.3511, - "step": 48570 - }, - { - "epoch": 97.2, - "grad_norm": 43.76838302612305, - "learning_rate": 2.7580839195498397e-06, - "loss": 0.3706, - "step": 48600 - }, - { - "epoch": 97.26, - "grad_norm": 65.14667510986328, - "learning_rate": 2.752469519870534e-06, - "loss": 0.3971, - "step": 48630 - }, - { - "epoch": 97.32, - "grad_norm": 62.264827728271484, - "learning_rate": 2.746858669348634e-06, - "loss": 0.3478, - "step": 48660 - }, - { - "epoch": 97.38, - "grad_norm": 28.317747116088867, - "learning_rate": 2.741251376844443e-06, - "loss": 0.3369, - "step": 48690 - }, - { - "epoch": 97.44, - "grad_norm": 50.689430236816406, - "learning_rate": 2.7356476512126386e-06, - "loss": 0.3473, - "step": 48720 - }, - { - "epoch": 97.5, - "grad_norm": 96.586181640625, - "learning_rate": 2.7300475013022666e-06, - "loss": 0.3622, - "step": 48750 - }, - { - "epoch": 97.56, - "grad_norm": 84.39799499511719, - "learning_rate": 2.724450935956733e-06, - "loss": 0.3246, - "step": 48780 - }, - { - "epoch": 97.62, - "grad_norm": 83.29969024658203, - "learning_rate": 2.718857964013773e-06, - "loss": 0.3915, - "step": 48810 - }, - { - "epoch": 97.68, - "grad_norm": 26.59626579284668, - "learning_rate": 2.713268594305458e-06, - "loss": 0.3597, - "step": 48840 - }, - { - "epoch": 97.74, - "grad_norm": 54.20785903930664, - "learning_rate": 2.707682835658163e-06, - "loss": 0.3688, - "step": 48870 - }, - { - "epoch": 97.8, - "grad_norm": 126.53070068359375, - "learning_rate": 2.7021006968925613e-06, - "loss": 0.3818, - "step": 48900 - }, - { - "epoch": 97.86, - "grad_norm": 0.0017745899967849255, - "learning_rate": 2.6965221868236156e-06, - "loss": 0.3398, - "step": 48930 - }, - { - "epoch": 97.92, - "grad_norm": 118.43617248535156, - "learning_rate": 2.6909473142605522e-06, - "loss": 0.3898, - "step": 48960 - }, - { - "epoch": 97.98, - "grad_norm": 61.02579879760742, - "learning_rate": 2.6853760880068587e-06, - "loss": 0.4638, - "step": 48990 - }, - { - "epoch": 98.0, - "eval_loss": 0.3107198178768158, - "eval_map": 0.782, - "eval_map_50": 0.9587, - "eval_map_75": 0.887, - "eval_map_chicken": 0.7726, - "eval_map_duck": 0.7132, - "eval_map_large": 0.8032, - "eval_map_medium": 0.783, - "eval_map_plant": 0.8601, - "eval_map_small": 0.3189, - "eval_mar_1": 0.3128, - "eval_mar_10": 0.8212, - "eval_mar_100": 0.8258, - "eval_mar_100_chicken": 0.8147, - "eval_mar_100_duck": 0.767, - "eval_mar_100_plant": 0.8958, - "eval_mar_large": 0.8441, - "eval_mar_medium": 0.8258, - "eval_mar_small": 0.3933, - "eval_runtime": 14.1225, - "eval_samples_per_second": 7.081, - "eval_steps_per_second": 0.921, - "step": 49000 - }, - { - "epoch": 98.04, - "grad_norm": 21.68953514099121, - "learning_rate": 2.6798085168602595e-06, - "loss": 0.5093, - "step": 49020 - }, - { - "epoch": 98.1, - "grad_norm": 57.37543487548828, - "learning_rate": 2.6742446096127086e-06, - "loss": 0.3139, - "step": 49050 - }, - { - "epoch": 98.16, - "grad_norm": 77.86444091796875, - "learning_rate": 2.668684375050378e-06, - "loss": 0.4126, - "step": 49080 - }, - { - "epoch": 98.22, - "grad_norm": 66.2899169921875, - "learning_rate": 2.663127821953633e-06, - "loss": 0.3734, - "step": 49110 - }, - { - "epoch": 98.28, - "grad_norm": 53.63509750366211, - "learning_rate": 2.6575749590970336e-06, - "loss": 0.3579, - "step": 49140 - }, - { - "epoch": 98.34, - "grad_norm": 38.823856353759766, - "learning_rate": 2.6520257952493066e-06, - "loss": 0.4116, - "step": 49170 - }, - { - "epoch": 98.4, - "grad_norm": 63.37985610961914, - "learning_rate": 2.646480339173337e-06, - "loss": 0.3824, - "step": 49200 - }, - { - "epoch": 98.46, - "grad_norm": 38.528717041015625, - "learning_rate": 2.6409385996261606e-06, - "loss": 0.3395, - "step": 49230 - }, - { - "epoch": 98.52, - "grad_norm": 60.49711990356445, - "learning_rate": 2.635400585358937e-06, - "loss": 0.3363, - "step": 49260 - }, - { - "epoch": 98.58, - "grad_norm": 59.21797561645508, - "learning_rate": 2.62986630511695e-06, - "loss": 0.4574, - "step": 49290 - }, - { - "epoch": 98.64, - "grad_norm": 58.201622009277344, - "learning_rate": 2.624335767639582e-06, - "loss": 0.5018, - "step": 49320 - }, - { - "epoch": 98.7, - "grad_norm": 54.895503997802734, - "learning_rate": 2.618808981660304e-06, - "loss": 0.3094, - "step": 49350 - }, - { - "epoch": 98.76, - "grad_norm": 67.75933837890625, - "learning_rate": 2.6132859559066704e-06, - "loss": 0.4307, - "step": 49380 - }, - { - "epoch": 98.82, - "grad_norm": 55.180294036865234, - "learning_rate": 2.607766699100288e-06, - "loss": 0.382, - "step": 49410 - }, - { - "epoch": 98.88, - "grad_norm": 81.35394287109375, - "learning_rate": 2.6022512199568205e-06, - "loss": 0.3102, - "step": 49440 - }, - { - "epoch": 98.94, - "grad_norm": 43.163002014160156, - "learning_rate": 2.5967395271859614e-06, - "loss": 0.4086, - "step": 49470 - }, - { - "epoch": 99.0, - "grad_norm": 65.92552947998047, - "learning_rate": 2.5912316294914232e-06, - "loss": 0.3504, - "step": 49500 - }, - { - "epoch": 99.0, - "eval_loss": 0.30719977617263794, - "eval_map": 0.7808, - "eval_map_50": 0.9538, - "eval_map_75": 0.9073, - "eval_map_chicken": 0.7752, - "eval_map_duck": 0.7103, - "eval_map_large": 0.8113, - "eval_map_medium": 0.7827, - "eval_map_plant": 0.8571, - "eval_map_small": 0.3213, - "eval_mar_1": 0.3134, - "eval_mar_10": 0.8181, - "eval_mar_100": 0.823, - "eval_mar_100_chicken": 0.823, - "eval_mar_100_duck": 0.7546, - "eval_mar_100_plant": 0.8912, - "eval_mar_large": 0.8499, - "eval_mar_medium": 0.8219, - "eval_mar_small": 0.4033, - "eval_runtime": 14.3241, - "eval_samples_per_second": 6.981, - "eval_steps_per_second": 0.908, - "step": 49500 - }, - { - "epoch": 99.06, - "grad_norm": 62.5239143371582, - "learning_rate": 2.5857275355709317e-06, - "loss": 0.3715, - "step": 49530 - }, - { - "epoch": 99.12, - "grad_norm": 88.1968765258789, - "learning_rate": 2.580227254116199e-06, - "loss": 0.4106, - "step": 49560 - }, - { - "epoch": 99.18, - "grad_norm": 91.27246856689453, - "learning_rate": 2.5747307938129245e-06, - "loss": 0.4021, - "step": 49590 - }, - { - "epoch": 99.24, - "grad_norm": 45.90950012207031, - "learning_rate": 2.5692381633407672e-06, - "loss": 0.3523, - "step": 49620 - }, - { - "epoch": 99.3, - "grad_norm": 34.13705062866211, - "learning_rate": 2.5637493713733376e-06, - "loss": 0.4114, - "step": 49650 - }, - { - "epoch": 99.36, - "grad_norm": 84.46089172363281, - "learning_rate": 2.558264426578192e-06, - "loss": 0.334, - "step": 49680 - }, - { - "epoch": 99.42, - "grad_norm": 58.19248580932617, - "learning_rate": 2.5527833376168055e-06, - "loss": 0.3926, - "step": 49710 - }, - { - "epoch": 99.48, - "grad_norm": 61.39611053466797, - "learning_rate": 2.547306113144564e-06, - "loss": 0.3741, - "step": 49740 - }, - { - "epoch": 99.54, - "grad_norm": 48.98357391357422, - "learning_rate": 2.541832761810753e-06, - "loss": 0.4374, - "step": 49770 - }, - { - "epoch": 99.6, - "grad_norm": 39.02640151977539, - "learning_rate": 2.536363292258543e-06, - "loss": 0.3768, - "step": 49800 - }, - { - "epoch": 99.66, - "grad_norm": 80.49829864501953, - "learning_rate": 2.5308977131249724e-06, - "loss": 0.3107, - "step": 49830 - }, - { - "epoch": 99.72, - "grad_norm": 91.48433685302734, - "learning_rate": 2.5254360330409343e-06, - "loss": 0.3672, - "step": 49860 - }, - { - "epoch": 99.78, - "grad_norm": 97.91492462158203, - "learning_rate": 2.5199782606311708e-06, - "loss": 0.3564, - "step": 49890 - }, - { - "epoch": 99.84, - "grad_norm": 56.21559524536133, - "learning_rate": 2.514524404514248e-06, - "loss": 0.388, - "step": 49920 - }, - { - "epoch": 99.9, - "grad_norm": 66.36531829833984, - "learning_rate": 2.509074473302546e-06, - "loss": 0.4225, - "step": 49950 - }, - { - "epoch": 99.96, - "grad_norm": 40.85894775390625, - "learning_rate": 2.503628475602256e-06, - "loss": 0.4122, - "step": 49980 - }, - { - "epoch": 100.0, - "eval_loss": 0.30709704756736755, - "eval_map": 0.7832, - "eval_map_50": 0.9591, - "eval_map_75": 0.9103, - "eval_map_chicken": 0.7704, - "eval_map_duck": 0.7221, - "eval_map_large": 0.7982, - "eval_map_medium": 0.7866, - "eval_map_plant": 0.8572, - "eval_map_small": 0.3515, - "eval_mar_1": 0.3125, - "eval_mar_10": 0.8203, - "eval_mar_100": 0.8259, - "eval_mar_100_chicken": 0.8179, - "eval_mar_100_duck": 0.7691, - "eval_mar_100_plant": 0.8909, - "eval_mar_large": 0.8408, - "eval_mar_medium": 0.8275, - "eval_mar_small": 0.4233, - "eval_runtime": 12.7791, - "eval_samples_per_second": 7.825, - "eval_steps_per_second": 1.017, - "step": 50000 - }, - { - "epoch": 100.02, - "grad_norm": 33.76742935180664, - "learning_rate": 2.4981864200133483e-06, - "loss": 0.3851, - "step": 50010 - }, - { - "epoch": 100.08, - "grad_norm": 90.33648681640625, - "learning_rate": 2.49274831512957e-06, - "loss": 0.3643, - "step": 50040 - }, - { - "epoch": 100.14, - "grad_norm": 27.876367568969727, - "learning_rate": 2.4873141695384346e-06, - "loss": 0.3785, - "step": 50070 - }, - { - "epoch": 100.2, - "grad_norm": 68.729736328125, - "learning_rate": 2.4818839918211963e-06, - "loss": 0.3525, - "step": 50100 - }, - { - "epoch": 100.26, - "grad_norm": 67.7789077758789, - "learning_rate": 2.4764577905528503e-06, - "loss": 0.3952, - "step": 50130 - }, - { - "epoch": 100.32, - "grad_norm": 29.81199836730957, - "learning_rate": 2.4710355743021077e-06, - "loss": 0.3813, - "step": 50160 - }, - { - "epoch": 100.38, - "grad_norm": 30.434463500976562, - "learning_rate": 2.4656173516313852e-06, - "loss": 0.4306, - "step": 50190 - }, - { - "epoch": 100.44, - "grad_norm": 41.9581298828125, - "learning_rate": 2.4602031310968013e-06, - "loss": 0.4288, - "step": 50220 - }, - { - "epoch": 100.5, - "grad_norm": 0.0003115141298621893, - "learning_rate": 2.4547929212481436e-06, - "loss": 0.3373, - "step": 50250 - }, - { - "epoch": 100.56, - "grad_norm": 40.25923538208008, - "learning_rate": 2.4493867306288772e-06, - "loss": 0.2919, - "step": 50280 - }, - { - "epoch": 100.62, - "grad_norm": 31.388107299804688, - "learning_rate": 2.4439845677761124e-06, - "loss": 0.4041, - "step": 50310 - }, - { - "epoch": 100.68, - "grad_norm": 54.791481018066406, - "learning_rate": 2.4385864412206e-06, - "loss": 0.4319, - "step": 50340 - }, - { - "epoch": 100.74, - "grad_norm": 111.72852325439453, - "learning_rate": 2.433192359486723e-06, - "loss": 0.3565, - "step": 50370 - }, - { - "epoch": 100.8, - "grad_norm": 179.5271453857422, - "learning_rate": 2.4278023310924676e-06, - "loss": 0.3688, - "step": 50400 - }, - { - "epoch": 100.86, - "grad_norm": 61.95014190673828, - "learning_rate": 2.422416364549429e-06, - "loss": 0.3575, - "step": 50430 - }, - { - "epoch": 100.92, - "grad_norm": 51.592926025390625, - "learning_rate": 2.417034468362782e-06, - "loss": 0.4289, - "step": 50460 - }, - { - "epoch": 100.98, - "grad_norm": 48.83248519897461, - "learning_rate": 2.4116566510312734e-06, - "loss": 0.4066, - "step": 50490 - }, - { - "epoch": 101.0, - "eval_loss": 0.3090997338294983, - "eval_map": 0.7845, - "eval_map_50": 0.9595, - "eval_map_75": 0.8987, - "eval_map_chicken": 0.7781, - "eval_map_duck": 0.7198, - "eval_map_large": 0.8005, - "eval_map_medium": 0.7879, - "eval_map_plant": 0.8555, - "eval_map_small": 0.3408, - "eval_mar_1": 0.3126, - "eval_mar_10": 0.82, - "eval_mar_100": 0.8259, - "eval_mar_100_chicken": 0.823, - "eval_mar_100_duck": 0.7649, - "eval_mar_100_plant": 0.8897, - "eval_mar_large": 0.8379, - "eval_mar_medium": 0.826, - "eval_mar_small": 0.4086, - "eval_runtime": 12.157, - "eval_samples_per_second": 8.226, - "eval_steps_per_second": 1.069, - "step": 50500 - }, - { - "epoch": 101.04, - "grad_norm": 83.6888656616211, - "learning_rate": 2.406282921047213e-06, - "loss": 0.364, - "step": 50520 - }, - { - "epoch": 101.1, - "grad_norm": 46.9664192199707, - "learning_rate": 2.4009132868964525e-06, - "loss": 0.3907, - "step": 50550 - }, - { - "epoch": 101.16, - "grad_norm": 49.857032775878906, - "learning_rate": 2.395547757058379e-06, - "loss": 0.4456, - "step": 50580 - }, - { - "epoch": 101.22, - "grad_norm": 65.27449798583984, - "learning_rate": 2.3901863400058954e-06, - "loss": 0.4042, - "step": 50610 - }, - { - "epoch": 101.28, - "grad_norm": 48.69483947753906, - "learning_rate": 2.3848290442054096e-06, - "loss": 0.3632, - "step": 50640 - }, - { - "epoch": 101.34, - "grad_norm": 0.0001556992210680619, - "learning_rate": 2.379475878116826e-06, - "loss": 0.3668, - "step": 50670 - }, - { - "epoch": 101.4, - "grad_norm": 53.774532318115234, - "learning_rate": 2.3741268501935212e-06, - "loss": 0.3668, - "step": 50700 - }, - { - "epoch": 101.46, - "grad_norm": 38.233299255371094, - "learning_rate": 2.368781968882343e-06, - "loss": 0.3889, - "step": 50730 - }, - { - "epoch": 101.52, - "grad_norm": 135.56581115722656, - "learning_rate": 2.3634412426235886e-06, - "loss": 0.3349, - "step": 50760 - }, - { - "epoch": 101.58, - "grad_norm": 35.401832580566406, - "learning_rate": 2.358104679850991e-06, - "loss": 0.3918, - "step": 50790 - }, - { - "epoch": 101.64, - "grad_norm": 75.53800201416016, - "learning_rate": 2.3527722889917147e-06, - "loss": 0.3939, - "step": 50820 - }, - { - "epoch": 101.7, - "grad_norm": 66.56050109863281, - "learning_rate": 2.3474440784663287e-06, - "loss": 0.3925, - "step": 50850 - }, - { - "epoch": 101.76, - "grad_norm": 55.19369125366211, - "learning_rate": 2.3421200566888096e-06, - "loss": 0.3704, - "step": 50880 - }, - { - "epoch": 101.82, - "grad_norm": 31.786827087402344, - "learning_rate": 2.3368002320665118e-06, - "loss": 0.4129, - "step": 50910 - }, - { - "epoch": 101.88, - "grad_norm": 45.33772277832031, - "learning_rate": 2.3314846130001622e-06, - "loss": 0.3603, - "step": 50940 - }, - { - "epoch": 101.94, - "grad_norm": 169.04415893554688, - "learning_rate": 2.326173207883854e-06, - "loss": 0.3808, - "step": 50970 - }, - { - "epoch": 102.0, - "grad_norm": 85.23856353759766, - "learning_rate": 2.320866025105016e-06, - "loss": 0.3207, - "step": 51000 - }, - { - "epoch": 102.0, - "eval_loss": 0.312703400850296, - "eval_map": 0.7783, - "eval_map_50": 0.9531, - "eval_map_75": 0.8992, - "eval_map_chicken": 0.7715, - "eval_map_duck": 0.7081, - "eval_map_large": 0.8049, - "eval_map_medium": 0.7782, - "eval_map_plant": 0.8555, - "eval_map_small": 0.3268, - "eval_mar_1": 0.312, - "eval_mar_10": 0.8201, - "eval_mar_100": 0.8238, - "eval_mar_100_chicken": 0.8198, - "eval_mar_100_duck": 0.7588, - "eval_mar_100_plant": 0.8927, - "eval_mar_large": 0.8476, - "eval_mar_medium": 0.8221, - "eval_mar_small": 0.4262, - "eval_runtime": 11.5117, - "eval_samples_per_second": 8.687, - "eval_steps_per_second": 1.129, - "step": 51000 - }, - { - "epoch": 102.06, - "grad_norm": 46.077938079833984, - "learning_rate": 2.3155630730444185e-06, - "loss": 0.4213, - "step": 51030 - }, - { - "epoch": 102.12, - "grad_norm": 94.91500091552734, - "learning_rate": 2.3102643600761445e-06, - "loss": 0.3484, - "step": 51060 - }, - { - "epoch": 102.18, - "grad_norm": 52.73749923706055, - "learning_rate": 2.3049698945675826e-06, - "loss": 0.5028, - "step": 51090 - }, - { - "epoch": 102.24, - "grad_norm": 63.331214904785156, - "learning_rate": 2.299679684879421e-06, - "loss": 0.3526, - "step": 51120 - }, - { - "epoch": 102.3, - "grad_norm": 97.68816375732422, - "learning_rate": 2.294393739365621e-06, - "loss": 0.359, - "step": 51150 - }, - { - "epoch": 102.36, - "grad_norm": 54.449188232421875, - "learning_rate": 2.289112066373411e-06, - "loss": 0.3525, - "step": 51180 - }, - { - "epoch": 102.42, - "grad_norm": 0.00014486142026726156, - "learning_rate": 2.2838346742432753e-06, - "loss": 0.32, - "step": 51210 - }, - { - "epoch": 102.48, - "grad_norm": 45.01613235473633, - "learning_rate": 2.2785615713089363e-06, - "loss": 0.3813, - "step": 51240 - }, - { - "epoch": 102.54, - "grad_norm": 46.19170379638672, - "learning_rate": 2.2732927658973427e-06, - "loss": 0.4768, - "step": 51270 - }, - { - "epoch": 102.6, - "grad_norm": 112.9385757446289, - "learning_rate": 2.268028266328655e-06, - "loss": 0.391, - "step": 51300 - }, - { - "epoch": 102.66, - "grad_norm": 47.39128112792969, - "learning_rate": 2.262768080916241e-06, - "loss": 0.4029, - "step": 51330 - }, - { - "epoch": 102.72, - "grad_norm": 42.99913024902344, - "learning_rate": 2.25751221796665e-06, - "loss": 0.3401, - "step": 51360 - }, - { - "epoch": 102.78, - "grad_norm": 0.0027169722598046064, - "learning_rate": 2.2522606857796036e-06, - "loss": 0.3397, - "step": 51390 - }, - { - "epoch": 102.84, - "grad_norm": 58.7538948059082, - "learning_rate": 2.247013492647994e-06, - "loss": 0.4043, - "step": 51420 - }, - { - "epoch": 102.9, - "grad_norm": 48.809879302978516, - "learning_rate": 2.2417706468578495e-06, - "loss": 0.3294, - "step": 51450 - }, - { - "epoch": 102.96, - "grad_norm": 62.58914566040039, - "learning_rate": 2.2365321566883437e-06, - "loss": 0.3462, - "step": 51480 - }, - { - "epoch": 103.0, - "eval_loss": 0.3051559329032898, - "eval_map": 0.7911, - "eval_map_50": 0.957, - "eval_map_75": 0.9074, - "eval_map_chicken": 0.7746, - "eval_map_duck": 0.7385, - "eval_map_large": 0.8058, - "eval_map_medium": 0.7945, - "eval_map_plant": 0.8601, - "eval_map_small": 0.3095, - "eval_mar_1": 0.3146, - "eval_mar_10": 0.8252, - "eval_mar_100": 0.83, - "eval_mar_100_chicken": 0.8194, - "eval_mar_100_duck": 0.7763, - "eval_mar_100_plant": 0.8942, - "eval_mar_large": 0.8423, - "eval_mar_medium": 0.8332, - "eval_mar_small": 0.41, - "eval_runtime": 12.9597, - "eval_samples_per_second": 7.716, - "eval_steps_per_second": 1.003, - "step": 51500 - }, - { - "epoch": 103.02, - "grad_norm": 41.60489273071289, - "learning_rate": 2.2312980304117656e-06, - "loss": 0.4564, - "step": 51510 - }, - { - "epoch": 103.08, - "grad_norm": 52.09795379638672, - "learning_rate": 2.2260682762935137e-06, - "loss": 0.3348, - "step": 51540 - }, - { - "epoch": 103.14, - "grad_norm": 35.459171295166016, - "learning_rate": 2.220842902592087e-06, - "loss": 0.318, - "step": 51570 - }, - { - "epoch": 103.2, - "grad_norm": 56.90756607055664, - "learning_rate": 2.2156219175590623e-06, - "loss": 0.3904, - "step": 51600 - }, - { - "epoch": 103.26, - "grad_norm": 253.49964904785156, - "learning_rate": 2.2104053294390847e-06, - "loss": 0.3861, - "step": 51630 - }, - { - "epoch": 103.32, - "grad_norm": 114.14154052734375, - "learning_rate": 2.2051931464698636e-06, - "loss": 0.3613, - "step": 51660 - }, - { - "epoch": 103.38, - "grad_norm": 70.50907135009766, - "learning_rate": 2.1999853768821433e-06, - "loss": 0.4526, - "step": 51690 - }, - { - "epoch": 103.44, - "grad_norm": 31.685640335083008, - "learning_rate": 2.1947820288997067e-06, - "loss": 0.3307, - "step": 51720 - }, - { - "epoch": 103.5, - "grad_norm": 83.51459503173828, - "learning_rate": 2.1895831107393485e-06, - "loss": 0.3688, - "step": 51750 - }, - { - "epoch": 103.56, - "grad_norm": 94.39881134033203, - "learning_rate": 2.1843886306108686e-06, - "loss": 0.3543, - "step": 51780 - }, - { - "epoch": 103.62, - "grad_norm": 0.00011255555727984756, - "learning_rate": 2.179198596717063e-06, - "loss": 0.3212, - "step": 51810 - }, - { - "epoch": 103.68, - "grad_norm": 64.85936737060547, - "learning_rate": 2.174013017253701e-06, - "loss": 0.3276, - "step": 51840 - }, - { - "epoch": 103.74, - "grad_norm": 117.15434265136719, - "learning_rate": 2.168831900409523e-06, - "loss": 0.3798, - "step": 51870 - }, - { - "epoch": 103.8, - "grad_norm": 72.23023986816406, - "learning_rate": 2.1636552543662187e-06, - "loss": 0.3488, - "step": 51900 - }, - { - "epoch": 103.86, - "grad_norm": 49.46271514892578, - "learning_rate": 2.158483087298417e-06, - "loss": 0.3513, - "step": 51930 - }, - { - "epoch": 103.92, - "grad_norm": 105.83992767333984, - "learning_rate": 2.153315407373679e-06, - "loss": 0.3863, - "step": 51960 - }, - { - "epoch": 103.98, - "grad_norm": 69.60438537597656, - "learning_rate": 2.1481522227524725e-06, - "loss": 0.3938, - "step": 51990 - }, - { - "epoch": 104.0, - "eval_loss": 0.29546305537223816, - "eval_map": 0.793, - "eval_map_50": 0.9638, - "eval_map_75": 0.9043, - "eval_map_chicken": 0.7777, - "eval_map_duck": 0.7434, - "eval_map_large": 0.8019, - "eval_map_medium": 0.7971, - "eval_map_plant": 0.858, - "eval_map_small": 0.3318, - "eval_mar_1": 0.3167, - "eval_mar_10": 0.8306, - "eval_mar_100": 0.8352, - "eval_mar_100_chicken": 0.825, - "eval_mar_100_duck": 0.7876, - "eval_mar_100_plant": 0.893, - "eval_mar_large": 0.8371, - "eval_mar_medium": 0.839, - "eval_mar_small": 0.4348, - "eval_runtime": 12.8257, - "eval_samples_per_second": 7.797, - "eval_steps_per_second": 1.014, - "step": 52000 - }, - { - "epoch": 104.04, - "grad_norm": 50.39177322387695, - "learning_rate": 2.1429935415881753e-06, - "loss": 0.4251, - "step": 52020 - }, - { - "epoch": 104.1, - "grad_norm": 224.1273651123047, - "learning_rate": 2.137839372027047e-06, - "loss": 0.3165, - "step": 52050 - }, - { - "epoch": 104.16, - "grad_norm": 37.61375045776367, - "learning_rate": 2.132689722208223e-06, - "loss": 0.3781, - "step": 52080 - }, - { - "epoch": 104.22, - "grad_norm": 67.83102416992188, - "learning_rate": 2.1275446002637063e-06, - "loss": 0.4611, - "step": 52110 - }, - { - "epoch": 104.28, - "grad_norm": 77.93596649169922, - "learning_rate": 2.1224040143183444e-06, - "loss": 0.3957, - "step": 52140 - }, - { - "epoch": 104.34, - "grad_norm": 79.39508819580078, - "learning_rate": 2.1172679724898264e-06, - "loss": 0.4244, - "step": 52170 - }, - { - "epoch": 104.4, - "grad_norm": 55.841068267822266, - "learning_rate": 2.112136482888663e-06, - "loss": 0.4066, - "step": 52200 - }, - { - "epoch": 104.46, - "grad_norm": 115.12725830078125, - "learning_rate": 2.107009553618174e-06, - "loss": 0.37, - "step": 52230 - }, - { - "epoch": 104.52, - "grad_norm": 54.75588607788086, - "learning_rate": 2.1018871927744844e-06, - "loss": 0.4377, - "step": 52260 - }, - { - "epoch": 104.58, - "grad_norm": 39.3360710144043, - "learning_rate": 2.0967694084464973e-06, - "loss": 0.3612, - "step": 52290 - }, - { - "epoch": 104.64, - "grad_norm": 69.55204010009766, - "learning_rate": 2.0916562087158964e-06, - "loss": 0.3786, - "step": 52320 - }, - { - "epoch": 104.7, - "grad_norm": 29.990087509155273, - "learning_rate": 2.0865476016571206e-06, - "loss": 0.3462, - "step": 52350 - }, - { - "epoch": 104.76, - "grad_norm": 100.50167083740234, - "learning_rate": 2.0814435953373554e-06, - "loss": 0.3205, - "step": 52380 - }, - { - "epoch": 104.82, - "grad_norm": 65.78687286376953, - "learning_rate": 2.076344197816527e-06, - "loss": 0.4182, - "step": 52410 - }, - { - "epoch": 104.88, - "grad_norm": 88.50749206542969, - "learning_rate": 2.0712494171472776e-06, - "loss": 0.3723, - "step": 52440 - }, - { - "epoch": 104.94, - "grad_norm": 130.68087768554688, - "learning_rate": 2.066159261374964e-06, - "loss": 0.3144, - "step": 52470 - }, - { - "epoch": 105.0, - "grad_norm": 40.799720764160156, - "learning_rate": 2.061073738537635e-06, - "loss": 0.3236, - "step": 52500 - }, - { - "epoch": 105.0, - "eval_loss": 0.29966458678245544, - "eval_map": 0.7909, - "eval_map_50": 0.9607, - "eval_map_75": 0.9079, - "eval_map_chicken": 0.7767, - "eval_map_duck": 0.7373, - "eval_map_large": 0.8059, - "eval_map_medium": 0.7935, - "eval_map_plant": 0.8588, - "eval_map_small": 0.3475, - "eval_mar_1": 0.3149, - "eval_mar_10": 0.8265, - "eval_mar_100": 0.8323, - "eval_mar_100_chicken": 0.8206, - "eval_mar_100_duck": 0.7825, - "eval_mar_100_plant": 0.8939, - "eval_mar_large": 0.8405, - "eval_mar_medium": 0.8326, - "eval_mar_small": 0.4552, - "eval_runtime": 13.5342, - "eval_samples_per_second": 7.389, - "eval_steps_per_second": 0.961, - "step": 52500 - }, - { - "epoch": 105.06, - "grad_norm": 55.08608627319336, - "learning_rate": 2.0559928566660235e-06, - "loss": 0.3468, - "step": 52530 - }, - { - "epoch": 105.12, - "grad_norm": 46.37060546875, - "learning_rate": 2.0509166237835398e-06, - "loss": 0.3615, - "step": 52560 - }, - { - "epoch": 105.18, - "grad_norm": 64.0909194946289, - "learning_rate": 2.0458450479062465e-06, - "loss": 0.3162, - "step": 52590 - }, - { - "epoch": 105.24, - "grad_norm": 39.000423431396484, - "learning_rate": 2.040778137042852e-06, - "loss": 0.4154, - "step": 52620 - }, - { - "epoch": 105.3, - "grad_norm": 384.0572509765625, - "learning_rate": 2.035715899194704e-06, - "loss": 0.4825, - "step": 52650 - }, - { - "epoch": 105.36, - "grad_norm": 68.53567504882812, - "learning_rate": 2.030658342355765e-06, - "loss": 0.344, - "step": 52680 - }, - { - "epoch": 105.42, - "grad_norm": 43.619197845458984, - "learning_rate": 2.025605474512608e-06, - "loss": 0.412, - "step": 52710 - }, - { - "epoch": 105.48, - "grad_norm": 38.31523132324219, - "learning_rate": 2.0205573036443994e-06, - "loss": 0.3037, - "step": 52740 - }, - { - "epoch": 105.54, - "grad_norm": 56.94728088378906, - "learning_rate": 2.0155138377228924e-06, - "loss": 0.4071, - "step": 52770 - }, - { - "epoch": 105.6, - "grad_norm": 76.192626953125, - "learning_rate": 2.0104750847124075e-06, - "loss": 0.3733, - "step": 52800 - }, - { - "epoch": 105.66, - "grad_norm": 94.97992706298828, - "learning_rate": 2.0054410525698217e-06, - "loss": 0.3688, - "step": 52830 - }, - { - "epoch": 105.72, - "grad_norm": 53.94303512573242, - "learning_rate": 2.0004117492445614e-06, - "loss": 0.408, - "step": 52860 - }, - { - "epoch": 105.78, - "grad_norm": 39.50190353393555, - "learning_rate": 1.9953871826785804e-06, - "loss": 0.357, - "step": 52890 - }, - { - "epoch": 105.84, - "grad_norm": 47.59618377685547, - "learning_rate": 1.990367360806359e-06, - "loss": 0.4536, - "step": 52920 - }, - { - "epoch": 105.9, - "grad_norm": 65.47077941894531, - "learning_rate": 1.9853522915548777e-06, - "loss": 0.3725, - "step": 52950 - }, - { - "epoch": 105.96, - "grad_norm": 64.24626159667969, - "learning_rate": 1.980341982843616e-06, - "loss": 0.3559, - "step": 52980 - }, - { - "epoch": 106.0, - "eval_loss": 0.2986926734447479, - "eval_map": 0.7918, - "eval_map_50": 0.9599, - "eval_map_75": 0.9093, - "eval_map_chicken": 0.7782, - "eval_map_duck": 0.7367, - "eval_map_large": 0.8102, - "eval_map_medium": 0.8003, - "eval_map_plant": 0.8606, - "eval_map_small": 0.3328, - "eval_mar_1": 0.3167, - "eval_mar_10": 0.8294, - "eval_mar_100": 0.8358, - "eval_mar_100_chicken": 0.8278, - "eval_mar_100_duck": 0.7856, - "eval_mar_100_plant": 0.8939, - "eval_mar_large": 0.8494, - "eval_mar_medium": 0.8392, - "eval_mar_small": 0.4367, - "eval_runtime": 14.3693, - "eval_samples_per_second": 6.959, - "eval_steps_per_second": 0.905, - "step": 53000 - }, - { - "epoch": 106.02, - "grad_norm": 446.3773498535156, - "learning_rate": 1.975336442584537e-06, - "loss": 0.3964, - "step": 53010 - }, - { - "epoch": 106.08, - "grad_norm": 54.21070861816406, - "learning_rate": 1.9703356786820687e-06, - "loss": 0.3464, - "step": 53040 - }, - { - "epoch": 106.14, - "grad_norm": 42.08112716674805, - "learning_rate": 1.9653396990331043e-06, - "loss": 0.3222, - "step": 53070 - }, - { - "epoch": 106.2, - "grad_norm": 111.56007385253906, - "learning_rate": 1.9603485115269743e-06, - "loss": 0.3567, - "step": 53100 - }, - { - "epoch": 106.26, - "grad_norm": 57.83928680419922, - "learning_rate": 1.955362124045445e-06, - "loss": 0.3416, - "step": 53130 - }, - { - "epoch": 106.32, - "grad_norm": 49.74007797241211, - "learning_rate": 1.9503805444627054e-06, - "loss": 0.3262, - "step": 53160 - }, - { - "epoch": 106.38, - "grad_norm": 27.027053833007812, - "learning_rate": 1.945403780645346e-06, - "loss": 0.4011, - "step": 53190 - }, - { - "epoch": 106.44, - "grad_norm": 50.88391876220703, - "learning_rate": 1.9404318404523605e-06, - "loss": 0.338, - "step": 53220 - }, - { - "epoch": 106.5, - "grad_norm": 55.862789154052734, - "learning_rate": 1.9354647317351187e-06, - "loss": 0.4111, - "step": 53250 - }, - { - "epoch": 106.56, - "grad_norm": 97.4269027709961, - "learning_rate": 1.930502462337362e-06, - "loss": 0.3457, - "step": 53280 - }, - { - "epoch": 106.62, - "grad_norm": 52.87917709350586, - "learning_rate": 1.9255450400951937e-06, - "loss": 0.472, - "step": 53310 - }, - { - "epoch": 106.68, - "grad_norm": 59.95462417602539, - "learning_rate": 1.920592472837057e-06, - "loss": 0.3568, - "step": 53340 - }, - { - "epoch": 106.74, - "grad_norm": 52.46572494506836, - "learning_rate": 1.9156447683837365e-06, - "loss": 0.4044, - "step": 53370 - }, - { - "epoch": 106.8, - "grad_norm": 42.97385787963867, - "learning_rate": 1.910701934548329e-06, - "loss": 0.3087, - "step": 53400 - }, - { - "epoch": 106.86, - "grad_norm": 58.958274841308594, - "learning_rate": 1.9057639791362437e-06, - "loss": 0.3998, - "step": 53430 - }, - { - "epoch": 106.92, - "grad_norm": 59.075439453125, - "learning_rate": 1.900830909945189e-06, - "loss": 0.3815, - "step": 53460 - }, - { - "epoch": 106.98, - "grad_norm": 41.899375915527344, - "learning_rate": 1.8959027347651527e-06, - "loss": 0.39, - "step": 53490 - }, - { - "epoch": 107.0, - "eval_loss": 0.3079011142253876, - "eval_map": 0.7835, - "eval_map_50": 0.961, - "eval_map_75": 0.9054, - "eval_map_chicken": 0.7606, - "eval_map_duck": 0.7349, - "eval_map_large": 0.7968, - "eval_map_medium": 0.7855, - "eval_map_plant": 0.8551, - "eval_map_small": 0.3091, - "eval_mar_1": 0.3115, - "eval_mar_10": 0.8186, - "eval_mar_100": 0.8253, - "eval_mar_100_chicken": 0.8079, - "eval_mar_100_duck": 0.7784, - "eval_mar_100_plant": 0.8897, - "eval_mar_large": 0.8377, - "eval_mar_medium": 0.8258, - "eval_mar_small": 0.409, - "eval_runtime": 13.9921, - "eval_samples_per_second": 7.147, - "eval_steps_per_second": 0.929, - "step": 53500 - }, - { - "epoch": 107.04, - "grad_norm": 37.67574691772461, - "learning_rate": 1.8909794613783943e-06, - "loss": 0.4248, - "step": 53520 - }, - { - "epoch": 107.1, - "grad_norm": 130.4075164794922, - "learning_rate": 1.8860610975594384e-06, - "loss": 0.3677, - "step": 53550 - }, - { - "epoch": 107.16, - "grad_norm": 74.20655822753906, - "learning_rate": 1.8811476510750486e-06, - "loss": 0.439, - "step": 53580 - }, - { - "epoch": 107.22, - "grad_norm": 49.37228775024414, - "learning_rate": 1.876239129684232e-06, - "loss": 0.3681, - "step": 53610 - }, - { - "epoch": 107.28, - "grad_norm": 113.44561004638672, - "learning_rate": 1.8713355411382117e-06, - "loss": 0.389, - "step": 53640 - }, - { - "epoch": 107.34, - "grad_norm": 0.00013752943777944893, - "learning_rate": 1.8664368931804211e-06, - "loss": 0.3334, - "step": 53670 - }, - { - "epoch": 107.4, - "grad_norm": 83.08969116210938, - "learning_rate": 1.8615431935464984e-06, - "loss": 0.3648, - "step": 53700 - }, - { - "epoch": 107.46, - "grad_norm": 139.56890869140625, - "learning_rate": 1.8566544499642587e-06, - "loss": 0.3751, - "step": 53730 - }, - { - "epoch": 107.52, - "grad_norm": 99.85262298583984, - "learning_rate": 1.8517706701536998e-06, - "loss": 0.4039, - "step": 53760 - }, - { - "epoch": 107.58, - "grad_norm": 54.01030349731445, - "learning_rate": 1.8468918618269749e-06, - "loss": 0.3843, - "step": 53790 - }, - { - "epoch": 107.64, - "grad_norm": 38.08380126953125, - "learning_rate": 1.8420180326883857e-06, - "loss": 0.3723, - "step": 53820 - }, - { - "epoch": 107.7, - "grad_norm": 61.52556228637695, - "learning_rate": 1.837149190434378e-06, - "loss": 0.3631, - "step": 53850 - }, - { - "epoch": 107.76, - "grad_norm": 69.80587005615234, - "learning_rate": 1.8322853427535148e-06, - "loss": 0.453, - "step": 53880 - }, - { - "epoch": 107.82, - "grad_norm": 38.5218505859375, - "learning_rate": 1.8274264973264782e-06, - "loss": 0.3513, - "step": 53910 - }, - { - "epoch": 107.88, - "grad_norm": 130.12522888183594, - "learning_rate": 1.822572661826047e-06, - "loss": 0.4019, - "step": 53940 - }, - { - "epoch": 107.94, - "grad_norm": 101.6468734741211, - "learning_rate": 1.8177238439170885e-06, - "loss": 0.3957, - "step": 53970 - }, - { - "epoch": 108.0, - "grad_norm": 304.1820373535156, - "learning_rate": 1.8128800512565514e-06, - "loss": 0.362, - "step": 54000 - }, - { - "epoch": 108.0, - "eval_loss": 0.2971864938735962, - "eval_map": 0.7924, - "eval_map_50": 0.9578, - "eval_map_75": 0.905, - "eval_map_chicken": 0.7803, - "eval_map_duck": 0.7422, - "eval_map_large": 0.8132, - "eval_map_medium": 0.7963, - "eval_map_plant": 0.8548, - "eval_map_small": 0.3031, - "eval_mar_1": 0.3145, - "eval_mar_10": 0.8291, - "eval_mar_100": 0.8352, - "eval_mar_100_chicken": 0.8234, - "eval_mar_100_duck": 0.7918, - "eval_mar_100_plant": 0.8903, - "eval_mar_large": 0.8524, - "eval_mar_medium": 0.8369, - "eval_mar_small": 0.4043, - "eval_runtime": 14.1627, - "eval_samples_per_second": 7.061, - "eval_steps_per_second": 0.918, - "step": 54000 - }, - { - "epoch": 108.06, - "grad_norm": 173.47152709960938, - "learning_rate": 1.8080412914934436e-06, - "loss": 0.3673, - "step": 54030 - }, - { - "epoch": 108.12, - "grad_norm": 94.0256118774414, - "learning_rate": 1.803207572268826e-06, - "loss": 0.3726, - "step": 54060 - }, - { - "epoch": 108.18, - "grad_norm": 98.87445831298828, - "learning_rate": 1.7983789012158037e-06, - "loss": 0.3516, - "step": 54090 - }, - { - "epoch": 108.24, - "grad_norm": 60.777549743652344, - "learning_rate": 1.7935552859595058e-06, - "loss": 0.4112, - "step": 54120 - }, - { - "epoch": 108.3, - "grad_norm": 38.98394775390625, - "learning_rate": 1.7887367341170781e-06, - "loss": 0.4322, - "step": 54150 - }, - { - "epoch": 108.36, - "grad_norm": 74.89652252197266, - "learning_rate": 1.7839232532976746e-06, - "loss": 0.3607, - "step": 54180 - }, - { - "epoch": 108.42, - "grad_norm": 70.75282287597656, - "learning_rate": 1.779114851102437e-06, - "loss": 0.4569, - "step": 54210 - }, - { - "epoch": 108.48, - "grad_norm": 65.15149688720703, - "learning_rate": 1.7743115351244883e-06, - "loss": 0.3689, - "step": 54240 - }, - { - "epoch": 108.54, - "grad_norm": 27.904132843017578, - "learning_rate": 1.769513312948919e-06, - "loss": 0.3312, - "step": 54270 - }, - { - "epoch": 108.6, - "grad_norm": 36.908485412597656, - "learning_rate": 1.7647201921527802e-06, - "loss": 0.3783, - "step": 54300 - }, - { - "epoch": 108.66, - "grad_norm": 102.91898345947266, - "learning_rate": 1.7599321803050595e-06, - "loss": 0.338, - "step": 54330 - }, - { - "epoch": 108.72, - "grad_norm": 36.946815490722656, - "learning_rate": 1.7551492849666857e-06, - "loss": 0.4, - "step": 54360 - }, - { - "epoch": 108.78, - "grad_norm": 38.67084503173828, - "learning_rate": 1.7503715136905014e-06, - "loss": 0.5506, - "step": 54390 - }, - { - "epoch": 108.84, - "grad_norm": 117.760498046875, - "learning_rate": 1.7455988740212576e-06, - "loss": 0.3726, - "step": 54420 - }, - { - "epoch": 108.9, - "grad_norm": 364.3804626464844, - "learning_rate": 1.7408313734956074e-06, - "loss": 0.4103, - "step": 54450 - }, - { - "epoch": 108.96, - "grad_norm": 56.165340423583984, - "learning_rate": 1.7360690196420816e-06, - "loss": 0.3628, - "step": 54480 - }, - { - "epoch": 109.0, - "eval_loss": 0.3163011074066162, - "eval_map": 0.7773, - "eval_map_50": 0.9624, - "eval_map_75": 0.9104, - "eval_map_chicken": 0.7642, - "eval_map_duck": 0.7221, - "eval_map_large": 0.7896, - "eval_map_medium": 0.7826, - "eval_map_plant": 0.8457, - "eval_map_small": 0.3353, - "eval_mar_1": 0.3092, - "eval_mar_10": 0.8181, - "eval_mar_100": 0.8238, - "eval_mar_100_chicken": 0.8131, - "eval_mar_100_duck": 0.7732, - "eval_mar_100_plant": 0.8852, - "eval_mar_large": 0.8397, - "eval_mar_medium": 0.8235, - "eval_mar_small": 0.4433, - "eval_runtime": 12.7216, - "eval_samples_per_second": 7.861, - "eval_steps_per_second": 1.022, - "step": 54500 - }, - { - "epoch": 109.02, - "grad_norm": 51.046871185302734, - "learning_rate": 1.7313118199810897e-06, - "loss": 0.2856, - "step": 54510 - }, - { - "epoch": 109.08, - "grad_norm": 83.52461242675781, - "learning_rate": 1.7265597820248987e-06, - "loss": 0.3736, - "step": 54540 - }, - { - "epoch": 109.14, - "grad_norm": 41.98723220825195, - "learning_rate": 1.7218129132776224e-06, - "loss": 0.3412, - "step": 54570 - }, - { - "epoch": 109.2, - "grad_norm": 31.22188949584961, - "learning_rate": 1.7170712212352187e-06, - "loss": 0.3972, - "step": 54600 - }, - { - "epoch": 109.26, - "grad_norm": 0.0001550310116726905, - "learning_rate": 1.7123347133854628e-06, - "loss": 0.313, - "step": 54630 - }, - { - "epoch": 109.32, - "grad_norm": 33.59311294555664, - "learning_rate": 1.7076033972079503e-06, - "loss": 0.4468, - "step": 54660 - }, - { - "epoch": 109.38, - "grad_norm": 44.10573196411133, - "learning_rate": 1.702877280174074e-06, - "loss": 0.3232, - "step": 54690 - }, - { - "epoch": 109.44, - "grad_norm": 26.812898635864258, - "learning_rate": 1.698156369747016e-06, - "loss": 0.3372, - "step": 54720 - }, - { - "epoch": 109.5, - "grad_norm": 48.606201171875, - "learning_rate": 1.6934406733817417e-06, - "loss": 0.3288, - "step": 54750 - }, - { - "epoch": 109.56, - "grad_norm": 109.12932586669922, - "learning_rate": 1.6887301985249754e-06, - "loss": 0.3282, - "step": 54780 - }, - { - "epoch": 109.62, - "grad_norm": 0.00013426481746137142, - "learning_rate": 1.6840249526152036e-06, - "loss": 0.34, - "step": 54810 - }, - { - "epoch": 109.68, - "grad_norm": 46.39686965942383, - "learning_rate": 1.6793249430826502e-06, - "loss": 0.3614, - "step": 54840 - }, - { - "epoch": 109.74, - "grad_norm": 67.07842254638672, - "learning_rate": 1.6746301773492701e-06, - "loss": 0.3838, - "step": 54870 - }, - { - "epoch": 109.8, - "grad_norm": 39.00133514404297, - "learning_rate": 1.6699406628287423e-06, - "loss": 0.3681, - "step": 54900 - }, - { - "epoch": 109.86, - "grad_norm": 66.28092956542969, - "learning_rate": 1.6652564069264476e-06, - "loss": 0.3662, - "step": 54930 - }, - { - "epoch": 109.92, - "grad_norm": 111.6198501586914, - "learning_rate": 1.6605774170394683e-06, - "loss": 0.3625, - "step": 54960 - }, - { - "epoch": 109.98, - "grad_norm": 81.31076049804688, - "learning_rate": 1.6559037005565665e-06, - "loss": 0.3574, - "step": 54990 - }, - { - "epoch": 110.0, - "eval_loss": 0.3099856972694397, - "eval_map": 0.781, - "eval_map_50": 0.9617, - "eval_map_75": 0.9053, - "eval_map_chicken": 0.7664, - "eval_map_duck": 0.7253, - "eval_map_large": 0.806, - "eval_map_medium": 0.7829, - "eval_map_plant": 0.8511, - "eval_map_small": 0.3376, - "eval_mar_1": 0.3118, - "eval_mar_10": 0.82, - "eval_mar_100": 0.8256, - "eval_mar_100_chicken": 0.8147, - "eval_mar_100_duck": 0.7753, - "eval_mar_100_plant": 0.887, - "eval_mar_large": 0.8469, - "eval_mar_medium": 0.8243, - "eval_mar_small": 0.4252, - "eval_runtime": 12.2209, - "eval_samples_per_second": 8.183, - "eval_steps_per_second": 1.064, - "step": 55000 - }, - { - "epoch": 110.04, - "grad_norm": 40.21201705932617, - "learning_rate": 1.651235264858177e-06, - "loss": 0.3335, - "step": 55020 - }, - { - "epoch": 110.1, - "grad_norm": 28.124114990234375, - "learning_rate": 1.6465721173164e-06, - "loss": 0.3032, - "step": 55050 - }, - { - "epoch": 110.16, - "grad_norm": 33.553504943847656, - "learning_rate": 1.6419142652949793e-06, - "loss": 0.2974, - "step": 55080 - }, - { - "epoch": 110.22, - "grad_norm": 41.741764068603516, - "learning_rate": 1.6372617161493014e-06, - "loss": 0.4531, - "step": 55110 - }, - { - "epoch": 110.28, - "grad_norm": 88.8398208618164, - "learning_rate": 1.6326144772263752e-06, - "loss": 0.4221, - "step": 55140 - }, - { - "epoch": 110.34, - "grad_norm": 63.48917007446289, - "learning_rate": 1.627972555864824e-06, - "loss": 0.3719, - "step": 55170 - }, - { - "epoch": 110.4, - "grad_norm": 35.19669723510742, - "learning_rate": 1.6233359593948777e-06, - "loss": 0.3571, - "step": 55200 - }, - { - "epoch": 110.46, - "grad_norm": 39.2208137512207, - "learning_rate": 1.618704695138353e-06, - "loss": 0.4188, - "step": 55230 - }, - { - "epoch": 110.52, - "grad_norm": 67.35260009765625, - "learning_rate": 1.6140787704086502e-06, - "loss": 0.283, - "step": 55260 - }, - { - "epoch": 110.58, - "grad_norm": 83.15595245361328, - "learning_rate": 1.6094581925107356e-06, - "loss": 0.5104, - "step": 55290 - }, - { - "epoch": 110.64, - "grad_norm": 67.90478515625, - "learning_rate": 1.6048429687411294e-06, - "loss": 0.4915, - "step": 55320 - }, - { - "epoch": 110.7, - "grad_norm": 63.72685623168945, - "learning_rate": 1.600233106387904e-06, - "loss": 0.3097, - "step": 55350 - }, - { - "epoch": 110.76, - "grad_norm": 56.029056549072266, - "learning_rate": 1.5956286127306591e-06, - "loss": 0.4279, - "step": 55380 - }, - { - "epoch": 110.82, - "grad_norm": 81.89627075195312, - "learning_rate": 1.591029495040518e-06, - "loss": 0.3538, - "step": 55410 - }, - { - "epoch": 110.88, - "grad_norm": 53.46123504638672, - "learning_rate": 1.586435760580118e-06, - "loss": 0.3456, - "step": 55440 - }, - { - "epoch": 110.94, - "grad_norm": 65.57443237304688, - "learning_rate": 1.5818474166035907e-06, - "loss": 0.3723, - "step": 55470 - }, - { - "epoch": 111.0, - "grad_norm": 80.52845764160156, - "learning_rate": 1.5772644703565564e-06, - "loss": 0.368, - "step": 55500 - }, - { - "epoch": 111.0, - "eval_loss": 0.2932773530483246, - "eval_map": 0.7928, - "eval_map_50": 0.9593, - "eval_map_75": 0.9002, - "eval_map_chicken": 0.79, - "eval_map_duck": 0.7313, - "eval_map_large": 0.8223, - "eval_map_medium": 0.7956, - "eval_map_plant": 0.857, - "eval_map_small": 0.3206, - "eval_mar_1": 0.3186, - "eval_mar_10": 0.8282, - "eval_mar_100": 0.8351, - "eval_mar_100_chicken": 0.8365, - "eval_mar_100_duck": 0.7753, - "eval_mar_100_plant": 0.8936, - "eval_mar_large": 0.8599, - "eval_mar_medium": 0.8349, - "eval_mar_small": 0.4252, - "eval_runtime": 13.1758, - "eval_samples_per_second": 7.59, - "eval_steps_per_second": 0.987, - "step": 55500 - }, - { - "epoch": 111.06, - "grad_norm": 32.08183670043945, - "learning_rate": 1.572686929076116e-06, - "loss": 0.3991, - "step": 55530 - }, - { - "epoch": 111.12, - "grad_norm": 39.98676681518555, - "learning_rate": 1.5681147999908308e-06, - "loss": 0.3826, - "step": 55560 - }, - { - "epoch": 111.18, - "grad_norm": 29.21529769897461, - "learning_rate": 1.5635480903207139e-06, - "loss": 0.3157, - "step": 55590 - }, - { - "epoch": 111.24, - "grad_norm": 42.81616973876953, - "learning_rate": 1.5589868072772279e-06, - "loss": 0.4127, - "step": 55620 - }, - { - "epoch": 111.3, - "grad_norm": 85.20896911621094, - "learning_rate": 1.554430958063259e-06, - "loss": 0.4262, - "step": 55650 - }, - { - "epoch": 111.36, - "grad_norm": 107.23535919189453, - "learning_rate": 1.5498805498731146e-06, - "loss": 0.3838, - "step": 55680 - }, - { - "epoch": 111.42, - "grad_norm": 52.67665481567383, - "learning_rate": 1.5453355898925094e-06, - "loss": 0.4067, - "step": 55710 - }, - { - "epoch": 111.48, - "grad_norm": 75.49931335449219, - "learning_rate": 1.5407960852985582e-06, - "loss": 0.3932, - "step": 55740 - }, - { - "epoch": 111.54, - "grad_norm": 85.12210083007812, - "learning_rate": 1.5362620432597559e-06, - "loss": 0.3752, - "step": 55770 - }, - { - "epoch": 111.6, - "grad_norm": 76.16122436523438, - "learning_rate": 1.531733470935976e-06, - "loss": 0.3884, - "step": 55800 - }, - { - "epoch": 111.66, - "grad_norm": 65.58129119873047, - "learning_rate": 1.5272103754784517e-06, - "loss": 0.3909, - "step": 55830 - }, - { - "epoch": 111.72, - "grad_norm": 118.35000610351562, - "learning_rate": 1.5226927640297663e-06, - "loss": 0.2849, - "step": 55860 - }, - { - "epoch": 111.78, - "grad_norm": 69.42806243896484, - "learning_rate": 1.5181806437238472e-06, - "loss": 0.4117, - "step": 55890 - }, - { - "epoch": 111.84, - "grad_norm": 28.676090240478516, - "learning_rate": 1.5136740216859464e-06, - "loss": 0.4249, - "step": 55920 - }, - { - "epoch": 111.9, - "grad_norm": 43.85958480834961, - "learning_rate": 1.5091729050326376e-06, - "loss": 0.3355, - "step": 55950 - }, - { - "epoch": 111.96, - "grad_norm": 48.95738983154297, - "learning_rate": 1.5046773008717968e-06, - "loss": 0.3394, - "step": 55980 - }, - { - "epoch": 112.0, - "eval_loss": 0.2972817122936249, - "eval_map": 0.792, - "eval_map_50": 0.9547, - "eval_map_75": 0.9061, - "eval_map_chicken": 0.7841, - "eval_map_duck": 0.7361, - "eval_map_large": 0.8306, - "eval_map_medium": 0.7922, - "eval_map_plant": 0.8559, - "eval_map_small": 0.3368, - "eval_mar_1": 0.3146, - "eval_mar_10": 0.827, - "eval_mar_100": 0.8325, - "eval_mar_100_chicken": 0.8294, - "eval_mar_100_duck": 0.7763, - "eval_mar_100_plant": 0.8918, - "eval_mar_large": 0.8643, - "eval_mar_medium": 0.83, - "eval_mar_small": 0.4029, - "eval_runtime": 14.2322, - "eval_samples_per_second": 7.026, - "eval_steps_per_second": 0.913, - "step": 56000 - }, - { - "epoch": 112.02, - "grad_norm": 252.1146240234375, - "learning_rate": 1.5001872163025954e-06, - "loss": 0.5405, - "step": 56010 - }, - { - "epoch": 112.08, - "grad_norm": 88.07685089111328, - "learning_rate": 1.4957026584154926e-06, - "loss": 0.3314, - "step": 56040 - }, - { - "epoch": 112.14, - "grad_norm": 74.59980773925781, - "learning_rate": 1.4912236342922143e-06, - "loss": 0.3907, - "step": 56070 - }, - { - "epoch": 112.2, - "grad_norm": 93.63352966308594, - "learning_rate": 1.4867501510057548e-06, - "loss": 0.3988, - "step": 56100 - }, - { - "epoch": 112.26, - "grad_norm": 31.659984588623047, - "learning_rate": 1.482282215620352e-06, - "loss": 0.318, - "step": 56130 - }, - { - "epoch": 112.32, - "grad_norm": 97.10539245605469, - "learning_rate": 1.4778198351914853e-06, - "loss": 0.4266, - "step": 56160 - }, - { - "epoch": 112.38, - "grad_norm": 135.10064697265625, - "learning_rate": 1.4733630167658652e-06, - "loss": 0.394, - "step": 56190 - }, - { - "epoch": 112.44, - "grad_norm": 58.0966911315918, - "learning_rate": 1.4689117673814135e-06, - "loss": 0.3845, - "step": 56220 - }, - { - "epoch": 112.5, - "grad_norm": 453.5458984375, - "learning_rate": 1.4644660940672628e-06, - "loss": 0.4354, - "step": 56250 - }, - { - "epoch": 112.56, - "grad_norm": 85.53357696533203, - "learning_rate": 1.4600260038437376e-06, - "loss": 0.3829, - "step": 56280 - }, - { - "epoch": 112.62, - "grad_norm": 73.85929107666016, - "learning_rate": 1.4555915037223438e-06, - "loss": 0.3584, - "step": 56310 - }, - { - "epoch": 112.68, - "grad_norm": 56.37699890136719, - "learning_rate": 1.4511626007057667e-06, - "loss": 0.3209, - "step": 56340 - }, - { - "epoch": 112.74, - "grad_norm": 48.00393295288086, - "learning_rate": 1.4467393017878444e-06, - "loss": 0.3399, - "step": 56370 - }, - { - "epoch": 112.8, - "grad_norm": 115.49342346191406, - "learning_rate": 1.4423216139535735e-06, - "loss": 0.3958, - "step": 56400 - }, - { - "epoch": 112.86, - "grad_norm": 76.94721221923828, - "learning_rate": 1.4379095441790847e-06, - "loss": 0.3699, - "step": 56430 - }, - { - "epoch": 112.92, - "grad_norm": 41.330772399902344, - "learning_rate": 1.4335030994316357e-06, - "loss": 0.3947, - "step": 56460 - }, - { - "epoch": 112.98, - "grad_norm": 63.65792465209961, - "learning_rate": 1.4291022866696086e-06, - "loss": 0.3677, - "step": 56490 - }, - { - "epoch": 113.0, - "eval_loss": 0.29187893867492676, - "eval_map": 0.7984, - "eval_map_50": 0.9604, - "eval_map_75": 0.9117, - "eval_map_chicken": 0.7855, - "eval_map_duck": 0.7524, - "eval_map_large": 0.8247, - "eval_map_medium": 0.7988, - "eval_map_plant": 0.8574, - "eval_map_small": 0.3672, - "eval_mar_1": 0.3174, - "eval_mar_10": 0.8343, - "eval_mar_100": 0.8398, - "eval_mar_100_chicken": 0.8321, - "eval_mar_100_duck": 0.7938, - "eval_mar_100_plant": 0.8933, - "eval_mar_large": 0.8588, - "eval_mar_medium": 0.837, - "eval_mar_small": 0.4433, - "eval_runtime": 13.2013, - "eval_samples_per_second": 7.575, - "eval_steps_per_second": 0.985, - "step": 56500 - }, - { - "epoch": 113.04, - "grad_norm": 54.97718048095703, - "learning_rate": 1.4247071128424838e-06, - "loss": 0.4341, - "step": 56520 - }, - { - "epoch": 113.1, - "grad_norm": 35.49183654785156, - "learning_rate": 1.420317584890844e-06, - "loss": 0.4105, - "step": 56550 - }, - { - "epoch": 113.16, - "grad_norm": 32.6884880065918, - "learning_rate": 1.4159337097463515e-06, - "loss": 0.4421, - "step": 56580 - }, - { - "epoch": 113.22, - "grad_norm": 64.88768005371094, - "learning_rate": 1.4115554943317416e-06, - "loss": 0.3604, - "step": 56610 - }, - { - "epoch": 113.28, - "grad_norm": 31.727033615112305, - "learning_rate": 1.407182945560817e-06, - "loss": 0.4024, - "step": 56640 - }, - { - "epoch": 113.34, - "grad_norm": 43.41179656982422, - "learning_rate": 1.402816070338427e-06, - "loss": 0.3722, - "step": 56670 - }, - { - "epoch": 113.4, - "grad_norm": 51.2356071472168, - "learning_rate": 1.3984548755604655e-06, - "loss": 0.3619, - "step": 56700 - }, - { - "epoch": 113.46, - "grad_norm": 73.18277740478516, - "learning_rate": 1.3940993681138533e-06, - "loss": 0.3624, - "step": 56730 - }, - { - "epoch": 113.52, - "grad_norm": 60.43366241455078, - "learning_rate": 1.38974955487653e-06, - "loss": 0.3175, - "step": 56760 - }, - { - "epoch": 113.58, - "grad_norm": 33.95436096191406, - "learning_rate": 1.3854054427174468e-06, - "loss": 0.4596, - "step": 56790 - }, - { - "epoch": 113.64, - "grad_norm": 103.40779876708984, - "learning_rate": 1.3810670384965469e-06, - "loss": 0.3958, - "step": 56820 - }, - { - "epoch": 113.7, - "grad_norm": 75.7718505859375, - "learning_rate": 1.3767343490647668e-06, - "loss": 0.3696, - "step": 56850 - }, - { - "epoch": 113.76, - "grad_norm": 33.47903060913086, - "learning_rate": 1.372407381264011e-06, - "loss": 0.4226, - "step": 56880 - }, - { - "epoch": 113.82, - "grad_norm": 264.2909240722656, - "learning_rate": 1.368086141927154e-06, - "loss": 0.3534, - "step": 56910 - }, - { - "epoch": 113.88, - "grad_norm": 35.629364013671875, - "learning_rate": 1.3637706378780209e-06, - "loss": 0.3504, - "step": 56940 - }, - { - "epoch": 113.94, - "grad_norm": 103.62637329101562, - "learning_rate": 1.3594608759313832e-06, - "loss": 0.4638, - "step": 56970 - }, - { - "epoch": 114.0, - "grad_norm": 50.443546295166016, - "learning_rate": 1.3551568628929434e-06, - "loss": 0.3681, - "step": 57000 - }, - { - "epoch": 114.0, - "eval_loss": 0.3044111430644989, - "eval_map": 0.7833, - "eval_map_50": 0.9586, - "eval_map_75": 0.8961, - "eval_map_chicken": 0.7709, - "eval_map_duck": 0.7311, - "eval_map_large": 0.8076, - "eval_map_medium": 0.786, - "eval_map_plant": 0.848, - "eval_map_small": 0.326, - "eval_mar_1": 0.3116, - "eval_mar_10": 0.8207, - "eval_mar_100": 0.8256, - "eval_mar_100_chicken": 0.8179, - "eval_mar_100_duck": 0.7732, - "eval_mar_100_plant": 0.8858, - "eval_mar_large": 0.8483, - "eval_mar_medium": 0.8261, - "eval_mar_small": 0.3905, - "eval_runtime": 13.853, - "eval_samples_per_second": 7.219, - "eval_steps_per_second": 0.938, - "step": 57000 - }, - { - "epoch": 114.06, - "grad_norm": 0.00010968352580675855, - "learning_rate": 1.350858605559323e-06, - "loss": 0.3761, - "step": 57030 - }, - { - "epoch": 114.12, - "grad_norm": 48.614933013916016, - "learning_rate": 1.346566110718061e-06, - "loss": 0.3686, - "step": 57060 - }, - { - "epoch": 114.18, - "grad_norm": 125.78142547607422, - "learning_rate": 1.3422793851475907e-06, - "loss": 0.3757, - "step": 57090 - }, - { - "epoch": 114.24, - "grad_norm": 0.00011565905879251659, - "learning_rate": 1.337998435617235e-06, - "loss": 0.3602, - "step": 57120 - }, - { - "epoch": 114.3, - "grad_norm": 96.23841094970703, - "learning_rate": 1.333723268887201e-06, - "loss": 0.3008, - "step": 57150 - }, - { - "epoch": 114.36, - "grad_norm": 62.80172348022461, - "learning_rate": 1.3294538917085586e-06, - "loss": 0.4119, - "step": 57180 - }, - { - "epoch": 114.42, - "grad_norm": 93.47703552246094, - "learning_rate": 1.3251903108232362e-06, - "loss": 0.3799, - "step": 57210 - }, - { - "epoch": 114.48, - "grad_norm": 52.14104461669922, - "learning_rate": 1.3209325329640126e-06, - "loss": 0.3715, - "step": 57240 - }, - { - "epoch": 114.54, - "grad_norm": 0.00017110643966589123, - "learning_rate": 1.316680564854499e-06, - "loss": 0.3831, - "step": 57270 - }, - { - "epoch": 114.6, - "grad_norm": 35.94871520996094, - "learning_rate": 1.312434413209131e-06, - "loss": 0.4229, - "step": 57300 - }, - { - "epoch": 114.66, - "grad_norm": 167.53306579589844, - "learning_rate": 1.3081940847331658e-06, - "loss": 0.3543, - "step": 57330 - }, - { - "epoch": 114.72, - "grad_norm": 104.39117431640625, - "learning_rate": 1.3039595861226579e-06, - "loss": 0.3481, - "step": 57360 - }, - { - "epoch": 114.78, - "grad_norm": 91.05123138427734, - "learning_rate": 1.2997309240644607e-06, - "loss": 0.3372, - "step": 57390 - }, - { - "epoch": 114.84, - "grad_norm": 74.6148910522461, - "learning_rate": 1.2955081052362072e-06, - "loss": 0.3995, - "step": 57420 - }, - { - "epoch": 114.9, - "grad_norm": 137.8092041015625, - "learning_rate": 1.2912911363063048e-06, - "loss": 0.3057, - "step": 57450 - }, - { - "epoch": 114.96, - "grad_norm": 110.8732681274414, - "learning_rate": 1.2870800239339237e-06, - "loss": 0.3562, - "step": 57480 - }, - { - "epoch": 115.0, - "eval_loss": 0.2903619110584259, - "eval_map": 0.7918, - "eval_map_50": 0.9632, - "eval_map_75": 0.8991, - "eval_map_chicken": 0.7843, - "eval_map_duck": 0.7299, - "eval_map_large": 0.8148, - "eval_map_medium": 0.793, - "eval_map_plant": 0.8612, - "eval_map_small": 0.3676, - "eval_mar_1": 0.3128, - "eval_mar_10": 0.8293, - "eval_mar_100": 0.8339, - "eval_mar_100_chicken": 0.827, - "eval_mar_100_duck": 0.7804, - "eval_mar_100_plant": 0.8942, - "eval_mar_large": 0.8539, - "eval_mar_medium": 0.8345, - "eval_mar_small": 0.4362, - "eval_runtime": 12.7646, - "eval_samples_per_second": 7.834, - "eval_steps_per_second": 1.018, - "step": 57500 - }, - { - "epoch": 115.02, - "grad_norm": 53.309932708740234, - "learning_rate": 1.2828747747689846e-06, - "loss": 0.4409, - "step": 57510 - }, - { - "epoch": 115.08, - "grad_norm": 59.835693359375, - "learning_rate": 1.2786753954521508e-06, - "loss": 0.3894, - "step": 57540 - }, - { - "epoch": 115.14, - "grad_norm": 53.01243209838867, - "learning_rate": 1.2744818926148157e-06, - "loss": 0.3477, - "step": 57570 - }, - { - "epoch": 115.2, - "grad_norm": 55.61727523803711, - "learning_rate": 1.2702942728790897e-06, - "loss": 0.383, - "step": 57600 - }, - { - "epoch": 115.26, - "grad_norm": 39.18339920043945, - "learning_rate": 1.2661125428577998e-06, - "loss": 0.4147, - "step": 57630 - }, - { - "epoch": 115.32, - "grad_norm": 0.00019836750288959593, - "learning_rate": 1.2619367091544654e-06, - "loss": 0.3769, - "step": 57660 - }, - { - "epoch": 115.38, - "grad_norm": 110.80290985107422, - "learning_rate": 1.2577667783633007e-06, - "loss": 0.3511, - "step": 57690 - }, - { - "epoch": 115.44, - "grad_norm": 38.717018127441406, - "learning_rate": 1.2536027570691938e-06, - "loss": 0.3022, - "step": 57720 - }, - { - "epoch": 115.5, - "grad_norm": 32.68162536621094, - "learning_rate": 1.2494446518477022e-06, - "loss": 0.329, - "step": 57750 - }, - { - "epoch": 115.56, - "grad_norm": 60.416648864746094, - "learning_rate": 1.2452924692650443e-06, - "loss": 0.3375, - "step": 57780 - }, - { - "epoch": 115.62, - "grad_norm": 49.8346061706543, - "learning_rate": 1.2411462158780791e-06, - "loss": 0.4005, - "step": 57810 - }, - { - "epoch": 115.68, - "grad_norm": 65.04740905761719, - "learning_rate": 1.2370058982343109e-06, - "loss": 0.3434, - "step": 57840 - }, - { - "epoch": 115.74, - "grad_norm": 87.59300994873047, - "learning_rate": 1.232871522871864e-06, - "loss": 0.4359, - "step": 57870 - }, - { - "epoch": 115.8, - "grad_norm": 36.64163589477539, - "learning_rate": 1.2287430963194807e-06, - "loss": 0.3086, - "step": 57900 - }, - { - "epoch": 115.86, - "grad_norm": 58.76565170288086, - "learning_rate": 1.2246206250965127e-06, - "loss": 0.3468, - "step": 57930 - }, - { - "epoch": 115.92, - "grad_norm": 207.4191436767578, - "learning_rate": 1.2205041157129017e-06, - "loss": 0.3749, - "step": 57960 - }, - { - "epoch": 115.98, - "grad_norm": 37.71302032470703, - "learning_rate": 1.2163935746691807e-06, - "loss": 0.3524, - "step": 57990 - }, - { - "epoch": 116.0, - "eval_loss": 0.2992992103099823, - "eval_map": 0.7868, - "eval_map_50": 0.9596, - "eval_map_75": 0.8935, - "eval_map_chicken": 0.7799, - "eval_map_duck": 0.7199, - "eval_map_large": 0.8053, - "eval_map_medium": 0.7868, - "eval_map_plant": 0.8604, - "eval_map_small": 0.3494, - "eval_mar_1": 0.3096, - "eval_mar_10": 0.8241, - "eval_mar_100": 0.8305, - "eval_mar_100_chicken": 0.8258, - "eval_mar_100_duck": 0.7691, - "eval_mar_100_plant": 0.8967, - "eval_mar_large": 0.8468, - "eval_mar_medium": 0.8306, - "eval_mar_small": 0.4462, - "eval_runtime": 13.8909, - "eval_samples_per_second": 7.199, - "eval_steps_per_second": 0.936, - "step": 58000 - }, - { - "epoch": 116.04, - "grad_norm": 118.13052368164062, - "learning_rate": 1.2122890084564542e-06, - "loss": 0.4271, - "step": 58020 - }, - { - "epoch": 116.1, - "grad_norm": 38.26741027832031, - "learning_rate": 1.2081904235563908e-06, - "loss": 0.4131, - "step": 58050 - }, - { - "epoch": 116.16, - "grad_norm": 157.98019409179688, - "learning_rate": 1.204097826441218e-06, - "loss": 0.3911, - "step": 58080 - }, - { - "epoch": 116.22, - "grad_norm": 55.6131477355957, - "learning_rate": 1.200011223573702e-06, - "loss": 0.4387, - "step": 58110 - }, - { - "epoch": 116.28, - "grad_norm": 51.9449577331543, - "learning_rate": 1.1959306214071508e-06, - "loss": 0.405, - "step": 58140 - }, - { - "epoch": 116.34, - "grad_norm": 33.6893424987793, - "learning_rate": 1.1918560263853902e-06, - "loss": 0.4189, - "step": 58170 - }, - { - "epoch": 116.4, - "grad_norm": 49.27923583984375, - "learning_rate": 1.18778744494276e-06, - "loss": 0.3933, - "step": 58200 - }, - { - "epoch": 116.46, - "grad_norm": 33.62586212158203, - "learning_rate": 1.1837248835041093e-06, - "loss": 0.4325, - "step": 58230 - }, - { - "epoch": 116.52, - "grad_norm": 41.31364440917969, - "learning_rate": 1.1796683484847731e-06, - "loss": 0.438, - "step": 58260 - }, - { - "epoch": 116.58, - "grad_norm": 35.33230972290039, - "learning_rate": 1.1756178462905782e-06, - "loss": 0.4034, - "step": 58290 - }, - { - "epoch": 116.64, - "grad_norm": 66.30696105957031, - "learning_rate": 1.1715733833178178e-06, - "loss": 0.3519, - "step": 58320 - }, - { - "epoch": 116.7, - "grad_norm": 76.4557876586914, - "learning_rate": 1.1675349659532514e-06, - "loss": 0.4278, - "step": 58350 - }, - { - "epoch": 116.76, - "grad_norm": 49.30228805541992, - "learning_rate": 1.1635026005740902e-06, - "loss": 0.412, - "step": 58380 - }, - { - "epoch": 116.82, - "grad_norm": 47.24932098388672, - "learning_rate": 1.159476293547992e-06, - "loss": 0.2973, - "step": 58410 - }, - { - "epoch": 116.88, - "grad_norm": 30.77100372314453, - "learning_rate": 1.1554560512330437e-06, - "loss": 0.2871, - "step": 58440 - }, - { - "epoch": 116.94, - "grad_norm": 70.23580932617188, - "learning_rate": 1.1514418799777554e-06, - "loss": 0.3809, - "step": 58470 - }, - { - "epoch": 117.0, - "grad_norm": 47.45207214355469, - "learning_rate": 1.1474337861210543e-06, - "loss": 0.3553, - "step": 58500 - }, - { - "epoch": 117.0, - "eval_loss": 0.2957250475883484, - "eval_map": 0.7906, - "eval_map_50": 0.9596, - "eval_map_75": 0.8967, - "eval_map_chicken": 0.7817, - "eval_map_duck": 0.7306, - "eval_map_large": 0.808, - "eval_map_medium": 0.7925, - "eval_map_plant": 0.8596, - "eval_map_small": 0.3272, - "eval_mar_1": 0.3134, - "eval_mar_10": 0.8307, - "eval_mar_100": 0.8368, - "eval_mar_100_chicken": 0.8298, - "eval_mar_100_duck": 0.7845, - "eval_mar_100_plant": 0.8961, - "eval_mar_large": 0.8503, - "eval_mar_medium": 0.8383, - "eval_mar_small": 0.4229, - "eval_runtime": 14.3775, - "eval_samples_per_second": 6.955, - "eval_steps_per_second": 0.904, - "step": 58500 - }, - { - "epoch": 117.06, - "grad_norm": 96.12175750732422, - "learning_rate": 1.1434317759922664e-06, - "loss": 0.4287, - "step": 58530 - }, - { - "epoch": 117.12, - "grad_norm": 33.77443313598633, - "learning_rate": 1.1394358559111101e-06, - "loss": 0.4672, - "step": 58560 - }, - { - "epoch": 117.18, - "grad_norm": 40.09837341308594, - "learning_rate": 1.135446032187692e-06, - "loss": 0.4058, - "step": 58590 - }, - { - "epoch": 117.24, - "grad_norm": 55.24795150756836, - "learning_rate": 1.1314623111224865e-06, - "loss": 0.3298, - "step": 58620 - }, - { - "epoch": 117.3, - "grad_norm": 45.98210906982422, - "learning_rate": 1.1274846990063314e-06, - "loss": 0.3776, - "step": 58650 - }, - { - "epoch": 117.36, - "grad_norm": 102.51956939697266, - "learning_rate": 1.1235132021204226e-06, - "loss": 0.502, - "step": 58680 - }, - { - "epoch": 117.42, - "grad_norm": 30.10770034790039, - "learning_rate": 1.1195478267362924e-06, - "loss": 0.397, - "step": 58710 - }, - { - "epoch": 117.48, - "grad_norm": 92.1784439086914, - "learning_rate": 1.1155885791158128e-06, - "loss": 0.2999, - "step": 58740 - }, - { - "epoch": 117.54, - "grad_norm": 42.1543083190918, - "learning_rate": 1.111635465511175e-06, - "loss": 0.3652, - "step": 58770 - }, - { - "epoch": 117.6, - "grad_norm": 27.44938087463379, - "learning_rate": 1.1076884921648834e-06, - "loss": 0.334, - "step": 58800 - }, - { - "epoch": 117.66, - "grad_norm": 101.73136138916016, - "learning_rate": 1.1037476653097501e-06, - "loss": 0.3323, - "step": 58830 - }, - { - "epoch": 117.72, - "grad_norm": 52.24256134033203, - "learning_rate": 1.0998129911688766e-06, - "loss": 0.3896, - "step": 58860 - }, - { - "epoch": 117.78, - "grad_norm": 47.46136474609375, - "learning_rate": 1.0958844759556525e-06, - "loss": 0.3121, - "step": 58890 - }, - { - "epoch": 117.84, - "grad_norm": 33.973873138427734, - "learning_rate": 1.0919621258737384e-06, - "loss": 0.3554, - "step": 58920 - }, - { - "epoch": 117.9, - "grad_norm": 43.18864440917969, - "learning_rate": 1.0880459471170597e-06, - "loss": 0.3597, - "step": 58950 - }, - { - "epoch": 117.96, - "grad_norm": 68.67835998535156, - "learning_rate": 1.0841359458697986e-06, - "loss": 0.3976, - "step": 58980 - }, - { - "epoch": 118.0, - "eval_loss": 0.296009361743927, - "eval_map": 0.7898, - "eval_map_50": 0.9594, - "eval_map_75": 0.8957, - "eval_map_chicken": 0.7777, - "eval_map_duck": 0.7295, - "eval_map_large": 0.8076, - "eval_map_medium": 0.7936, - "eval_map_plant": 0.8623, - "eval_map_small": 0.3654, - "eval_mar_1": 0.3122, - "eval_mar_10": 0.8276, - "eval_mar_100": 0.8337, - "eval_mar_100_chicken": 0.8262, - "eval_mar_100_duck": 0.7763, - "eval_mar_100_plant": 0.8985, - "eval_mar_large": 0.8466, - "eval_mar_medium": 0.8373, - "eval_mar_small": 0.451, - "eval_runtime": 12.1457, - "eval_samples_per_second": 8.233, - "eval_steps_per_second": 1.07, - "step": 59000 - }, - { - "epoch": 118.02, - "grad_norm": 51.64205551147461, - "learning_rate": 1.0802321283063794e-06, - "loss": 0.3503, - "step": 59010 - }, - { - "epoch": 118.08, - "grad_norm": 93.20966339111328, - "learning_rate": 1.0763345005914649e-06, - "loss": 0.3564, - "step": 59040 - }, - { - "epoch": 118.14, - "grad_norm": 143.384765625, - "learning_rate": 1.0724430688799402e-06, - "loss": 0.3468, - "step": 59070 - }, - { - "epoch": 118.2, - "grad_norm": 50.321495056152344, - "learning_rate": 1.0685578393169054e-06, - "loss": 0.3834, - "step": 59100 - }, - { - "epoch": 118.26, - "grad_norm": 58.955322265625, - "learning_rate": 1.0646788180376716e-06, - "loss": 0.5129, - "step": 59130 - }, - { - "epoch": 118.32, - "grad_norm": 50.25168228149414, - "learning_rate": 1.0608060111677409e-06, - "loss": 0.309, - "step": 59160 - }, - { - "epoch": 118.38, - "grad_norm": 64.03470611572266, - "learning_rate": 1.0569394248228026e-06, - "loss": 0.4569, - "step": 59190 - }, - { - "epoch": 118.44, - "grad_norm": 89.09526062011719, - "learning_rate": 1.053079065108728e-06, - "loss": 0.3403, - "step": 59220 - }, - { - "epoch": 118.5, - "grad_norm": 194.41836547851562, - "learning_rate": 1.049224938121548e-06, - "loss": 0.3238, - "step": 59250 - }, - { - "epoch": 118.56, - "grad_norm": 30.023624420166016, - "learning_rate": 1.0453770499474585e-06, - "loss": 0.4011, - "step": 59280 - }, - { - "epoch": 118.62, - "grad_norm": 47.413875579833984, - "learning_rate": 1.0415354066627993e-06, - "loss": 0.3756, - "step": 59310 - }, - { - "epoch": 118.68, - "grad_norm": 42.15473937988281, - "learning_rate": 1.037700014334047e-06, - "loss": 0.3933, - "step": 59340 - }, - { - "epoch": 118.74, - "grad_norm": 64.5782699584961, - "learning_rate": 1.0338708790178136e-06, - "loss": 0.3386, - "step": 59370 - }, - { - "epoch": 118.8, - "grad_norm": 85.28560638427734, - "learning_rate": 1.0300480067608232e-06, - "loss": 0.3758, - "step": 59400 - }, - { - "epoch": 118.86, - "grad_norm": 64.15291595458984, - "learning_rate": 1.026231403599915e-06, - "loss": 0.3428, - "step": 59430 - }, - { - "epoch": 118.92, - "grad_norm": 130.6211700439453, - "learning_rate": 1.0224210755620257e-06, - "loss": 0.3277, - "step": 59460 - }, - { - "epoch": 118.98, - "grad_norm": 62.73011779785156, - "learning_rate": 1.0186170286641816e-06, - "loss": 0.3359, - "step": 59490 - }, - { - "epoch": 119.0, - "eval_loss": 0.30188411474227905, - "eval_map": 0.787, - "eval_map_50": 0.9608, - "eval_map_75": 0.901, - "eval_map_chicken": 0.7713, - "eval_map_duck": 0.7276, - "eval_map_large": 0.8063, - "eval_map_medium": 0.7874, - "eval_map_plant": 0.8622, - "eval_map_small": 0.3603, - "eval_mar_1": 0.3129, - "eval_mar_10": 0.8247, - "eval_mar_100": 0.83, - "eval_mar_100_chicken": 0.8187, - "eval_mar_100_duck": 0.7753, - "eval_mar_100_plant": 0.8961, - "eval_mar_large": 0.8428, - "eval_mar_medium": 0.8295, - "eval_mar_small": 0.4529, - "eval_runtime": 14.1353, - "eval_samples_per_second": 7.074, - "eval_steps_per_second": 0.92, - "step": 59500 - }, - { - "epoch": 119.04, - "grad_norm": 159.86578369140625, - "learning_rate": 1.014819268913495e-06, - "loss": 0.3958, - "step": 59520 - }, - { - "epoch": 119.1, - "grad_norm": 101.12600708007812, - "learning_rate": 1.0110278023071445e-06, - "loss": 0.3693, - "step": 59550 - }, - { - "epoch": 119.16, - "grad_norm": 46.749698638916016, - "learning_rate": 1.0072426348323754e-06, - "loss": 0.3607, - "step": 59580 - }, - { - "epoch": 119.22, - "grad_norm": 57.13641357421875, - "learning_rate": 1.0034637724664832e-06, - "loss": 0.3197, - "step": 59610 - }, - { - "epoch": 119.28, - "grad_norm": 43.5272216796875, - "learning_rate": 9.99691221176805e-07, - "loss": 0.2973, - "step": 59640 - }, - { - "epoch": 119.34, - "grad_norm": 96.45797729492188, - "learning_rate": 9.959249869207177e-07, - "loss": 0.3693, - "step": 59670 - }, - { - "epoch": 119.4, - "grad_norm": 93.45145416259766, - "learning_rate": 9.921650756456164e-07, - "loss": 0.396, - "step": 59700 - }, - { - "epoch": 119.46, - "grad_norm": 81.01191711425781, - "learning_rate": 9.884114932889172e-07, - "loss": 0.3534, - "step": 59730 - }, - { - "epoch": 119.52, - "grad_norm": 33.083866119384766, - "learning_rate": 9.84664245778037e-07, - "loss": 0.316, - "step": 59760 - }, - { - "epoch": 119.58, - "grad_norm": 40.107078552246094, - "learning_rate": 9.809233390303901e-07, - "loss": 0.4417, - "step": 59790 - }, - { - "epoch": 119.64, - "grad_norm": 60.68373107910156, - "learning_rate": 9.771887789533818e-07, - "loss": 0.3847, - "step": 59820 - }, - { - "epoch": 119.7, - "grad_norm": 26.99202537536621, - "learning_rate": 9.734605714443906e-07, - "loss": 0.3442, - "step": 59850 - }, - { - "epoch": 119.76, - "grad_norm": 27.286752700805664, - "learning_rate": 9.69738722390765e-07, - "loss": 0.3815, - "step": 59880 - }, - { - "epoch": 119.82, - "grad_norm": 119.09711456298828, - "learning_rate": 9.66023237669812e-07, - "loss": 0.3455, - "step": 59910 - }, - { - "epoch": 119.88, - "grad_norm": 58.220664978027344, - "learning_rate": 9.623141231487904e-07, - "loss": 0.3299, - "step": 59940 - }, - { - "epoch": 119.94, - "grad_norm": 46.67108917236328, - "learning_rate": 9.586113846848982e-07, - "loss": 0.391, - "step": 59970 - }, - { - "epoch": 120.0, - "grad_norm": 66.8419418334961, - "learning_rate": 9.549150281252633e-07, - "loss": 0.3539, - "step": 60000 - }, - { - "epoch": 120.0, - "eval_loss": 0.29548418521881104, - "eval_map": 0.791, - "eval_map_50": 0.9618, - "eval_map_75": 0.8983, - "eval_map_chicken": 0.7759, - "eval_map_duck": 0.7341, - "eval_map_large": 0.809, - "eval_map_medium": 0.7919, - "eval_map_plant": 0.8629, - "eval_map_small": 0.346, - "eval_mar_1": 0.3134, - "eval_mar_10": 0.828, - "eval_mar_100": 0.8339, - "eval_mar_100_chicken": 0.8234, - "eval_mar_100_duck": 0.7804, - "eval_mar_100_plant": 0.8979, - "eval_mar_large": 0.8467, - "eval_mar_medium": 0.8337, - "eval_mar_small": 0.4557, - "eval_runtime": 12.9494, - "eval_samples_per_second": 7.722, - "eval_steps_per_second": 1.004, - "step": 60000 - }, - { - "epoch": 120.06, - "grad_norm": 53.99040603637695, - "learning_rate": 9.512250593069394e-07, - "loss": 0.3768, - "step": 60030 - }, - { - "epoch": 120.12, - "grad_norm": 45.8270378112793, - "learning_rate": 9.475414840568903e-07, - "loss": 0.3543, - "step": 60060 - }, - { - "epoch": 120.18, - "grad_norm": 183.52630615234375, - "learning_rate": 9.438643081919818e-07, - "loss": 0.3369, - "step": 60090 - }, - { - "epoch": 120.24, - "grad_norm": 87.49842071533203, - "learning_rate": 9.401935375189802e-07, - "loss": 0.3055, - "step": 60120 - }, - { - "epoch": 120.3, - "grad_norm": 0.0009844176238402724, - "learning_rate": 9.365291778345303e-07, - "loss": 0.3699, - "step": 60150 - }, - { - "epoch": 120.36, - "grad_norm": 73.72267150878906, - "learning_rate": 9.32871234925159e-07, - "loss": 0.3816, - "step": 60180 - }, - { - "epoch": 120.42, - "grad_norm": 64.15357208251953, - "learning_rate": 9.29219714567256e-07, - "loss": 0.3545, - "step": 60210 - }, - { - "epoch": 120.48, - "grad_norm": 99.92349243164062, - "learning_rate": 9.255746225270689e-07, - "loss": 0.3186, - "step": 60240 - }, - { - "epoch": 120.54, - "grad_norm": 45.437252044677734, - "learning_rate": 9.21935964560699e-07, - "loss": 0.438, - "step": 60270 - }, - { - "epoch": 120.6, - "grad_norm": 9.287581633543596e-05, - "learning_rate": 9.183037464140804e-07, - "loss": 0.3379, - "step": 60300 - }, - { - "epoch": 120.66, - "grad_norm": 70.52328491210938, - "learning_rate": 9.146779738229838e-07, - "loss": 0.4137, - "step": 60330 - }, - { - "epoch": 120.72, - "grad_norm": 45.03104019165039, - "learning_rate": 9.110586525129988e-07, - "loss": 0.3361, - "step": 60360 - }, - { - "epoch": 120.78, - "grad_norm": 51.95904541015625, - "learning_rate": 9.074457881995252e-07, - "loss": 0.378, - "step": 60390 - }, - { - "epoch": 120.84, - "grad_norm": 76.6165542602539, - "learning_rate": 9.038393865877725e-07, - "loss": 0.3417, - "step": 60420 - }, - { - "epoch": 120.9, - "grad_norm": 32.872440338134766, - "learning_rate": 9.002394533727382e-07, - "loss": 0.3922, - "step": 60450 - }, - { - "epoch": 120.96, - "grad_norm": 33.17911148071289, - "learning_rate": 8.966459942392108e-07, - "loss": 0.3807, - "step": 60480 - }, - { - "epoch": 121.0, - "eval_loss": 0.29254433512687683, - "eval_map": 0.7959, - "eval_map_50": 0.9593, - "eval_map_75": 0.894, - "eval_map_chicken": 0.7827, - "eval_map_duck": 0.7384, - "eval_map_large": 0.8155, - "eval_map_medium": 0.7973, - "eval_map_plant": 0.8665, - "eval_map_small": 0.3381, - "eval_mar_1": 0.3171, - "eval_mar_10": 0.834, - "eval_mar_100": 0.8391, - "eval_mar_100_chicken": 0.8321, - "eval_mar_100_duck": 0.7856, - "eval_mar_100_plant": 0.8997, - "eval_mar_large": 0.8493, - "eval_mar_medium": 0.8399, - "eval_mar_small": 0.4519, - "eval_runtime": 13.8422, - "eval_samples_per_second": 7.224, - "eval_steps_per_second": 0.939, - "step": 60500 - }, - { - "epoch": 121.02, - "grad_norm": 75.32990264892578, - "learning_rate": 8.930590148617513e-07, - "loss": 0.3599, - "step": 60510 - }, - { - "epoch": 121.08, - "grad_norm": 50.39398956298828, - "learning_rate": 8.894785209046886e-07, - "loss": 0.3459, - "step": 60540 - }, - { - "epoch": 121.14, - "grad_norm": 7.005995576037094e-05, - "learning_rate": 8.859045180221137e-07, - "loss": 0.332, - "step": 60570 - }, - { - "epoch": 121.2, - "grad_norm": 44.23671340942383, - "learning_rate": 8.823370118578628e-07, - "loss": 0.3197, - "step": 60600 - }, - { - "epoch": 121.26, - "grad_norm": 102.2528305053711, - "learning_rate": 8.787760080455171e-07, - "loss": 0.3731, - "step": 60630 - }, - { - "epoch": 121.32, - "grad_norm": 27.199970245361328, - "learning_rate": 8.752215122083874e-07, - "loss": 0.3436, - "step": 60660 - }, - { - "epoch": 121.38, - "grad_norm": 59.93872833251953, - "learning_rate": 8.716735299595059e-07, - "loss": 0.4162, - "step": 60690 - }, - { - "epoch": 121.44, - "grad_norm": 8.24006856419146e-05, - "learning_rate": 8.68132066901623e-07, - "loss": 0.4192, - "step": 60720 - }, - { - "epoch": 121.5, - "grad_norm": 61.620506286621094, - "learning_rate": 8.645971286271903e-07, - "loss": 0.3545, - "step": 60750 - }, - { - "epoch": 121.56, - "grad_norm": 30.510093688964844, - "learning_rate": 8.610687207183604e-07, - "loss": 0.3393, - "step": 60780 - }, - { - "epoch": 121.62, - "grad_norm": 32.98684310913086, - "learning_rate": 8.575468487469696e-07, - "loss": 0.4148, - "step": 60810 - }, - { - "epoch": 121.68, - "grad_norm": 54.892974853515625, - "learning_rate": 8.540315182745329e-07, - "loss": 0.4938, - "step": 60840 - }, - { - "epoch": 121.74, - "grad_norm": 58.480010986328125, - "learning_rate": 8.505227348522404e-07, - "loss": 0.4128, - "step": 60870 - }, - { - "epoch": 121.8, - "grad_norm": 46.77655792236328, - "learning_rate": 8.470205040209362e-07, - "loss": 0.3208, - "step": 60900 - }, - { - "epoch": 121.86, - "grad_norm": 149.3266143798828, - "learning_rate": 8.435248313111244e-07, - "loss": 0.4722, - "step": 60930 - }, - { - "epoch": 121.92, - "grad_norm": 143.2934112548828, - "learning_rate": 8.400357222429473e-07, - "loss": 0.3419, - "step": 60960 - }, - { - "epoch": 121.98, - "grad_norm": 166.79092407226562, - "learning_rate": 8.365531823261841e-07, - "loss": 0.3657, - "step": 60990 - }, - { - "epoch": 122.0, - "eval_loss": 0.3005896806716919, - "eval_map": 0.7916, - "eval_map_50": 0.9634, - "eval_map_75": 0.8955, - "eval_map_chicken": 0.7768, - "eval_map_duck": 0.7377, - "eval_map_large": 0.8187, - "eval_map_medium": 0.7899, - "eval_map_plant": 0.8604, - "eval_map_small": 0.3356, - "eval_mar_1": 0.3182, - "eval_mar_10": 0.8276, - "eval_mar_100": 0.8345, - "eval_mar_100_chicken": 0.8242, - "eval_mar_100_duck": 0.7835, - "eval_mar_100_plant": 0.8958, - "eval_mar_large": 0.8516, - "eval_mar_medium": 0.834, - "eval_mar_small": 0.4352, - "eval_runtime": 12.9954, - "eval_samples_per_second": 7.695, - "eval_steps_per_second": 1.0, - "step": 61000 - }, - { - "epoch": 122.04, - "grad_norm": 46.02410125732422, - "learning_rate": 8.330772170602424e-07, - "loss": 0.3836, - "step": 61020 - }, - { - "epoch": 122.1, - "grad_norm": 55.28064727783203, - "learning_rate": 8.296078319341444e-07, - "loss": 0.3722, - "step": 61050 - }, - { - "epoch": 122.16, - "grad_norm": 97.92649841308594, - "learning_rate": 8.261450324265225e-07, - "loss": 0.3995, - "step": 61080 - }, - { - "epoch": 122.22, - "grad_norm": 42.298309326171875, - "learning_rate": 8.226888240056114e-07, - "loss": 0.4435, - "step": 61110 - }, - { - "epoch": 122.28, - "grad_norm": 50.94303894042969, - "learning_rate": 8.192392121292336e-07, - "loss": 0.3301, - "step": 61140 - }, - { - "epoch": 122.34, - "grad_norm": 136.8793487548828, - "learning_rate": 8.157962022448001e-07, - "loss": 0.3758, - "step": 61170 - }, - { - "epoch": 122.4, - "grad_norm": 71.58943939208984, - "learning_rate": 8.123597997892918e-07, - "loss": 0.3393, - "step": 61200 - }, - { - "epoch": 122.46, - "grad_norm": 57.700557708740234, - "learning_rate": 8.089300101892561e-07, - "loss": 0.3534, - "step": 61230 - }, - { - "epoch": 122.52, - "grad_norm": 95.97938537597656, - "learning_rate": 8.055068388608011e-07, - "loss": 0.4093, - "step": 61260 - }, - { - "epoch": 122.58, - "grad_norm": 24.18108367919922, - "learning_rate": 8.020902912095807e-07, - "loss": 0.4185, - "step": 61290 - }, - { - "epoch": 122.64, - "grad_norm": 39.89807891845703, - "learning_rate": 7.986803726307901e-07, - "loss": 0.2931, - "step": 61320 - }, - { - "epoch": 122.7, - "grad_norm": 84.0215072631836, - "learning_rate": 7.952770885091548e-07, - "loss": 0.4033, - "step": 61350 - }, - { - "epoch": 122.76, - "grad_norm": 58.67879104614258, - "learning_rate": 7.918804442189271e-07, - "loss": 0.4203, - "step": 61380 - }, - { - "epoch": 122.82, - "grad_norm": 15.713956832885742, - "learning_rate": 7.884904451238712e-07, - "loss": 0.3599, - "step": 61410 - }, - { - "epoch": 122.88, - "grad_norm": 38.39372634887695, - "learning_rate": 7.851070965772572e-07, - "loss": 0.3012, - "step": 61440 - }, - { - "epoch": 122.94, - "grad_norm": 105.68817138671875, - "learning_rate": 7.81730403921856e-07, - "loss": 0.3878, - "step": 61470 - }, - { - "epoch": 123.0, - "grad_norm": 44.60169219970703, - "learning_rate": 7.783603724899258e-07, - "loss": 0.3388, - "step": 61500 - }, - { - "epoch": 123.0, - "eval_loss": 0.29849478602409363, - "eval_map": 0.7894, - "eval_map_50": 0.9631, - "eval_map_75": 0.8973, - "eval_map_chicken": 0.7735, - "eval_map_duck": 0.7316, - "eval_map_large": 0.8084, - "eval_map_medium": 0.7913, - "eval_map_plant": 0.8629, - "eval_map_small": 0.3342, - "eval_mar_1": 0.3131, - "eval_mar_10": 0.8275, - "eval_mar_100": 0.833, - "eval_mar_100_chicken": 0.8206, - "eval_mar_100_duck": 0.7814, - "eval_mar_100_plant": 0.897, - "eval_mar_large": 0.8481, - "eval_mar_medium": 0.8346, - "eval_mar_small": 0.44, - "eval_runtime": 13.9696, - "eval_samples_per_second": 7.158, - "eval_steps_per_second": 0.931, - "step": 61500 - }, - { - "epoch": 123.06, - "grad_norm": 99.0871810913086, - "learning_rate": 7.749970076032048e-07, - "loss": 0.318, - "step": 61530 - }, - { - "epoch": 123.12, - "grad_norm": 143.69134521484375, - "learning_rate": 7.716403145729073e-07, - "loss": 0.3372, - "step": 61560 - }, - { - "epoch": 123.18, - "grad_norm": 7.875735173001885e-05, - "learning_rate": 7.682902986997076e-07, - "loss": 0.4084, - "step": 61590 - }, - { - "epoch": 123.24, - "grad_norm": 93.30904388427734, - "learning_rate": 7.649469652737407e-07, - "loss": 0.3368, - "step": 61620 - }, - { - "epoch": 123.3, - "grad_norm": 46.52485275268555, - "learning_rate": 7.61610319574585e-07, - "loss": 0.3304, - "step": 61650 - }, - { - "epoch": 123.36, - "grad_norm": 118.18556213378906, - "learning_rate": 7.582803668712579e-07, - "loss": 0.3169, - "step": 61680 - }, - { - "epoch": 123.42, - "grad_norm": 38.636016845703125, - "learning_rate": 7.549571124222127e-07, - "loss": 0.428, - "step": 61710 - }, - { - "epoch": 123.48, - "grad_norm": 79.80267333984375, - "learning_rate": 7.51640561475318e-07, - "loss": 0.4249, - "step": 61740 - }, - { - "epoch": 123.54, - "grad_norm": 40.69455337524414, - "learning_rate": 7.48330719267864e-07, - "loss": 0.3385, - "step": 61770 - }, - { - "epoch": 123.6, - "grad_norm": 43.14628219604492, - "learning_rate": 7.450275910265415e-07, - "loss": 0.3611, - "step": 61800 - }, - { - "epoch": 123.66, - "grad_norm": 83.33329010009766, - "learning_rate": 7.4173118196744e-07, - "loss": 0.3173, - "step": 61830 - }, - { - "epoch": 123.72, - "grad_norm": 52.423152923583984, - "learning_rate": 7.384414972960419e-07, - "loss": 0.5249, - "step": 61860 - }, - { - "epoch": 123.78, - "grad_norm": 42.12984848022461, - "learning_rate": 7.351585422072049e-07, - "loss": 0.4306, - "step": 61890 - }, - { - "epoch": 123.84, - "grad_norm": 137.32691955566406, - "learning_rate": 7.318823218851668e-07, - "loss": 0.2652, - "step": 61920 - }, - { - "epoch": 123.9, - "grad_norm": 92.33072662353516, - "learning_rate": 7.286128415035249e-07, - "loss": 0.3685, - "step": 61950 - }, - { - "epoch": 123.96, - "grad_norm": 54.6385612487793, - "learning_rate": 7.253501062252338e-07, - "loss": 0.3234, - "step": 61980 - }, - { - "epoch": 124.0, - "eval_loss": 0.29493066668510437, - "eval_map": 0.7951, - "eval_map_50": 0.9601, - "eval_map_75": 0.8963, - "eval_map_chicken": 0.7824, - "eval_map_duck": 0.7392, - "eval_map_large": 0.8059, - "eval_map_medium": 0.7999, - "eval_map_plant": 0.8636, - "eval_map_small": 0.3344, - "eval_mar_1": 0.3156, - "eval_mar_10": 0.8322, - "eval_mar_100": 0.8381, - "eval_mar_100_chicken": 0.8306, - "eval_mar_100_duck": 0.7845, - "eval_mar_100_plant": 0.8991, - "eval_mar_large": 0.8458, - "eval_mar_medium": 0.8401, - "eval_mar_small": 0.4452, - "eval_runtime": 13.1519, - "eval_samples_per_second": 7.603, - "eval_steps_per_second": 0.988, - "step": 62000 - }, - { - "epoch": 124.02, - "grad_norm": 56.340145111083984, - "learning_rate": 7.220941212026005e-07, - "loss": 0.4014, - "step": 62010 - }, - { - "epoch": 124.08, - "grad_norm": 51.8863639831543, - "learning_rate": 7.188448915772673e-07, - "loss": 0.3636, - "step": 62040 - }, - { - "epoch": 124.14, - "grad_norm": 78.32695007324219, - "learning_rate": 7.156024224802139e-07, - "loss": 0.3389, - "step": 62070 - }, - { - "epoch": 124.2, - "grad_norm": 30.821731567382812, - "learning_rate": 7.123667190317396e-07, - "loss": 0.3596, - "step": 62100 - }, - { - "epoch": 124.26, - "grad_norm": 86.81900787353516, - "learning_rate": 7.091377863414611e-07, - "loss": 0.3607, - "step": 62130 - }, - { - "epoch": 124.32, - "grad_norm": 44.02219009399414, - "learning_rate": 7.059156295083064e-07, - "loss": 0.3836, - "step": 62160 - }, - { - "epoch": 124.38, - "grad_norm": 61.75017547607422, - "learning_rate": 7.027002536204986e-07, - "loss": 0.4119, - "step": 62190 - }, - { - "epoch": 124.44, - "grad_norm": 33.044376373291016, - "learning_rate": 6.994916637555571e-07, - "loss": 0.3634, - "step": 62220 - }, - { - "epoch": 124.5, - "grad_norm": 80.2425308227539, - "learning_rate": 6.962898649802824e-07, - "loss": 0.2843, - "step": 62250 - }, - { - "epoch": 124.56, - "grad_norm": 59.19382858276367, - "learning_rate": 6.930948623507505e-07, - "loss": 0.3495, - "step": 62280 - }, - { - "epoch": 124.62, - "grad_norm": 52.384849548339844, - "learning_rate": 6.89906660912309e-07, - "loss": 0.3775, - "step": 62310 - }, - { - "epoch": 124.68, - "grad_norm": 46.481658935546875, - "learning_rate": 6.86725265699561e-07, - "loss": 0.329, - "step": 62340 - }, - { - "epoch": 124.74, - "grad_norm": 64.0755386352539, - "learning_rate": 6.835506817363657e-07, - "loss": 0.3089, - "step": 62370 - }, - { - "epoch": 124.8, - "grad_norm": 123.5768814086914, - "learning_rate": 6.803829140358237e-07, - "loss": 0.3505, - "step": 62400 - }, - { - "epoch": 124.86, - "grad_norm": 161.73182678222656, - "learning_rate": 6.772219676002717e-07, - "loss": 0.3278, - "step": 62430 - }, - { - "epoch": 124.92, - "grad_norm": 78.50151824951172, - "learning_rate": 6.74067847421277e-07, - "loss": 0.3474, - "step": 62460 - }, - { - "epoch": 124.98, - "grad_norm": 126.38793182373047, - "learning_rate": 6.709205584796241e-07, - "loss": 0.341, - "step": 62490 - }, - { - "epoch": 125.0, - "eval_loss": 0.29178693890571594, - "eval_map": 0.7977, - "eval_map_50": 0.964, - "eval_map_75": 0.9012, - "eval_map_chicken": 0.783, - "eval_map_duck": 0.7453, - "eval_map_large": 0.82, - "eval_map_medium": 0.8003, - "eval_map_plant": 0.8647, - "eval_map_small": 0.3369, - "eval_mar_1": 0.3165, - "eval_mar_10": 0.836, - "eval_mar_100": 0.8414, - "eval_mar_100_chicken": 0.8294, - "eval_mar_100_duck": 0.7948, - "eval_mar_100_plant": 0.9, - "eval_mar_large": 0.8564, - "eval_mar_medium": 0.8434, - "eval_mar_small": 0.4419, - "eval_runtime": 13.1198, - "eval_samples_per_second": 7.622, - "eval_steps_per_second": 0.991, - "step": 62500 - }, - { - "epoch": 125.04, - "grad_norm": 121.4775619506836, - "learning_rate": 6.677801057453143e-07, - "loss": 0.3543, - "step": 62520 - }, - { - "epoch": 125.1, - "grad_norm": 61.96651077270508, - "learning_rate": 6.646464941775499e-07, - "loss": 0.3352, - "step": 62550 - }, - { - "epoch": 125.16, - "grad_norm": 52.88582992553711, - "learning_rate": 6.615197287247299e-07, - "loss": 0.2526, - "step": 62580 - }, - { - "epoch": 125.22, - "grad_norm": 9.414328815182671e-05, - "learning_rate": 6.583998143244463e-07, - "loss": 0.302, - "step": 62610 - }, - { - "epoch": 125.28, - "grad_norm": 116.23927307128906, - "learning_rate": 6.552867559034687e-07, - "loss": 0.3437, - "step": 62640 - }, - { - "epoch": 125.34, - "grad_norm": 46.484642028808594, - "learning_rate": 6.521805583777396e-07, - "loss": 0.3909, - "step": 62670 - }, - { - "epoch": 125.4, - "grad_norm": 38.19538879394531, - "learning_rate": 6.490812266523716e-07, - "loss": 0.3869, - "step": 62700 - }, - { - "epoch": 125.46, - "grad_norm": 34.6130256652832, - "learning_rate": 6.459887656216318e-07, - "loss": 0.35, - "step": 62730 - }, - { - "epoch": 125.52, - "grad_norm": 43.729305267333984, - "learning_rate": 6.429031801689362e-07, - "loss": 0.464, - "step": 62760 - }, - { - "epoch": 125.58, - "grad_norm": 60.23460006713867, - "learning_rate": 6.398244751668481e-07, - "loss": 0.3092, - "step": 62790 - }, - { - "epoch": 125.64, - "grad_norm": 45.13640594482422, - "learning_rate": 6.36752655477062e-07, - "loss": 0.3121, - "step": 62820 - }, - { - "epoch": 125.7, - "grad_norm": 64.78380584716797, - "learning_rate": 6.336877259504004e-07, - "loss": 0.3658, - "step": 62850 - }, - { - "epoch": 125.76, - "grad_norm": 76.02064514160156, - "learning_rate": 6.30629691426804e-07, - "loss": 0.4133, - "step": 62880 - }, - { - "epoch": 125.82, - "grad_norm": 190.0027313232422, - "learning_rate": 6.275785567353293e-07, - "loss": 0.3969, - "step": 62910 - }, - { - "epoch": 125.88, - "grad_norm": 53.93574905395508, - "learning_rate": 6.245343266941328e-07, - "loss": 0.3821, - "step": 62940 - }, - { - "epoch": 125.94, - "grad_norm": 68.3726577758789, - "learning_rate": 6.214970061104686e-07, - "loss": 0.3249, - "step": 62970 - }, - { - "epoch": 126.0, - "grad_norm": 59.181270599365234, - "learning_rate": 6.184665997806832e-07, - "loss": 0.3289, - "step": 63000 - }, - { - "epoch": 126.0, - "eval_loss": 0.2899820804595947, - "eval_map": 0.8004, - "eval_map_50": 0.9627, - "eval_map_75": 0.904, - "eval_map_chicken": 0.7823, - "eval_map_duck": 0.7492, - "eval_map_large": 0.823, - "eval_map_medium": 0.8034, - "eval_map_plant": 0.8698, - "eval_map_small": 0.3378, - "eval_mar_1": 0.3186, - "eval_mar_10": 0.8403, - "eval_mar_100": 0.8461, - "eval_mar_100_chicken": 0.8329, - "eval_mar_100_duck": 0.8031, - "eval_mar_100_plant": 0.9021, - "eval_mar_large": 0.8596, - "eval_mar_medium": 0.8482, - "eval_mar_small": 0.4452, - "eval_runtime": 11.9663, - "eval_samples_per_second": 8.357, - "eval_steps_per_second": 1.086, - "step": 63000 - }, - { - "epoch": 126.06, - "grad_norm": 32.981258392333984, - "learning_rate": 6.154431124901983e-07, - "loss": 0.4104, - "step": 63030 - }, - { - "epoch": 126.12, - "grad_norm": 65.4036636352539, - "learning_rate": 6.124265490135161e-07, - "loss": 0.3999, - "step": 63060 - }, - { - "epoch": 126.18, - "grad_norm": 76.22710418701172, - "learning_rate": 6.094169141142014e-07, - "loss": 0.3464, - "step": 63090 - }, - { - "epoch": 126.24, - "grad_norm": 64.0662841796875, - "learning_rate": 6.064142125448763e-07, - "loss": 0.3239, - "step": 63120 - }, - { - "epoch": 126.3, - "grad_norm": 35.752437591552734, - "learning_rate": 6.034184490472195e-07, - "loss": 0.3733, - "step": 63150 - }, - { - "epoch": 126.36, - "grad_norm": 136.5454864501953, - "learning_rate": 6.004296283519478e-07, - "loss": 0.3767, - "step": 63180 - }, - { - "epoch": 126.42, - "grad_norm": 66.61968231201172, - "learning_rate": 5.974477551788194e-07, - "loss": 0.3702, - "step": 63210 - }, - { - "epoch": 126.48, - "grad_norm": 108.3598403930664, - "learning_rate": 5.944728342366179e-07, - "loss": 0.3706, - "step": 63240 - }, - { - "epoch": 126.54, - "grad_norm": 58.992515563964844, - "learning_rate": 5.915048702231491e-07, - "loss": 0.3487, - "step": 63270 - }, - { - "epoch": 126.6, - "grad_norm": 73.31640625, - "learning_rate": 5.885438678252342e-07, - "loss": 0.3358, - "step": 63300 - }, - { - "epoch": 126.66, - "grad_norm": 39.52558517456055, - "learning_rate": 5.855898317186992e-07, - "loss": 0.3686, - "step": 63330 - }, - { - "epoch": 126.72, - "grad_norm": 36.256874084472656, - "learning_rate": 5.826427665683715e-07, - "loss": 0.3185, - "step": 63360 - }, - { - "epoch": 126.78, - "grad_norm": 38.929039001464844, - "learning_rate": 5.797026770280683e-07, - "loss": 0.3652, - "step": 63390 - }, - { - "epoch": 126.84, - "grad_norm": 65.80767822265625, - "learning_rate": 5.767695677405921e-07, - "loss": 0.3059, - "step": 63420 - }, - { - "epoch": 126.9, - "grad_norm": 76.24812316894531, - "learning_rate": 5.738434433377244e-07, - "loss": 0.3191, - "step": 63450 - }, - { - "epoch": 126.96, - "grad_norm": 30.609939575195312, - "learning_rate": 5.709243084402128e-07, - "loss": 0.3619, - "step": 63480 - }, - { - "epoch": 127.0, - "eval_loss": 0.29183581471443176, - "eval_map": 0.7985, - "eval_map_50": 0.9625, - "eval_map_75": 0.8978, - "eval_map_chicken": 0.7839, - "eval_map_duck": 0.745, - "eval_map_large": 0.8171, - "eval_map_medium": 0.804, - "eval_map_plant": 0.8668, - "eval_map_small": 0.3304, - "eval_mar_1": 0.3174, - "eval_mar_10": 0.8368, - "eval_mar_100": 0.8421, - "eval_mar_100_chicken": 0.8294, - "eval_mar_100_duck": 0.7969, - "eval_mar_100_plant": 0.9, - "eval_mar_large": 0.855, - "eval_mar_medium": 0.8459, - "eval_mar_small": 0.4114, - "eval_runtime": 13.5585, - "eval_samples_per_second": 7.375, - "eval_steps_per_second": 0.959, - "step": 63500 - }, - { - "epoch": 127.02, - "grad_norm": 32.957435607910156, - "learning_rate": 5.680121676577721e-07, - "loss": 0.3466, - "step": 63510 - }, - { - "epoch": 127.08, - "grad_norm": 8.321553468704224e-05, - "learning_rate": 5.651070255890689e-07, - "loss": 0.3952, - "step": 63540 - }, - { - "epoch": 127.14, - "grad_norm": 44.196449279785156, - "learning_rate": 5.622088868217179e-07, - "loss": 0.4008, - "step": 63570 - }, - { - "epoch": 127.2, - "grad_norm": 31.003173828125, - "learning_rate": 5.593177559322776e-07, - "loss": 0.3913, - "step": 63600 - }, - { - "epoch": 127.26, - "grad_norm": 58.132354736328125, - "learning_rate": 5.564336374862373e-07, - "loss": 0.3001, - "step": 63630 - }, - { - "epoch": 127.32, - "grad_norm": 81.96055603027344, - "learning_rate": 5.535565360380146e-07, - "loss": 0.2915, - "step": 63660 - }, - { - "epoch": 127.38, - "grad_norm": 141.5048370361328, - "learning_rate": 5.506864561309455e-07, - "loss": 0.3209, - "step": 63690 - }, - { - "epoch": 127.44, - "grad_norm": 39.172306060791016, - "learning_rate": 5.478234022972756e-07, - "loss": 0.4754, - "step": 63720 - }, - { - "epoch": 127.5, - "grad_norm": 40.754241943359375, - "learning_rate": 5.449673790581611e-07, - "loss": 0.3568, - "step": 63750 - }, - { - "epoch": 127.56, - "grad_norm": 37.0576286315918, - "learning_rate": 5.421183909236494e-07, - "loss": 0.3897, - "step": 63780 - }, - { - "epoch": 127.62, - "grad_norm": 68.6433334350586, - "learning_rate": 5.392764423926844e-07, - "loss": 0.3309, - "step": 63810 - }, - { - "epoch": 127.68, - "grad_norm": 54.752647399902344, - "learning_rate": 5.364415379530891e-07, - "loss": 0.3066, - "step": 63840 - }, - { - "epoch": 127.74, - "grad_norm": 39.858787536621094, - "learning_rate": 5.33613682081564e-07, - "loss": 0.3913, - "step": 63870 - }, - { - "epoch": 127.8, - "grad_norm": 38.397804260253906, - "learning_rate": 5.307928792436812e-07, - "loss": 0.291, - "step": 63900 - }, - { - "epoch": 127.86, - "grad_norm": 61.00391387939453, - "learning_rate": 5.279791338938717e-07, - "loss": 0.3015, - "step": 63930 - }, - { - "epoch": 127.92, - "grad_norm": 23.472204208374023, - "learning_rate": 5.251724504754258e-07, - "loss": 0.3911, - "step": 63960 - }, - { - "epoch": 127.98, - "grad_norm": 39.998695373535156, - "learning_rate": 5.22372833420478e-07, - "loss": 0.3725, - "step": 63990 - }, - { - "epoch": 128.0, - "eval_loss": 0.29072773456573486, - "eval_map": 0.7956, - "eval_map_50": 0.9634, - "eval_map_75": 0.8987, - "eval_map_chicken": 0.7829, - "eval_map_duck": 0.7403, - "eval_map_large": 0.8105, - "eval_map_medium": 0.8023, - "eval_map_plant": 0.8636, - "eval_map_small": 0.3324, - "eval_mar_1": 0.3157, - "eval_mar_10": 0.8345, - "eval_mar_100": 0.8401, - "eval_mar_100_chicken": 0.8266, - "eval_mar_100_duck": 0.7948, - "eval_mar_100_plant": 0.8988, - "eval_mar_large": 0.8508, - "eval_mar_medium": 0.8446, - "eval_mar_small": 0.4267, - "eval_runtime": 14.3016, - "eval_samples_per_second": 6.992, - "eval_steps_per_second": 0.909, - "step": 64000 - }, - { - "epoch": 128.04, - "grad_norm": 57.42071533203125, - "learning_rate": 5.19580287150005e-07, - "loss": 0.4087, - "step": 64020 - }, - { - "epoch": 128.1, - "grad_norm": 48.32342529296875, - "learning_rate": 5.167948160738206e-07, - "loss": 0.3399, - "step": 64050 - }, - { - "epoch": 128.16, - "grad_norm": 157.54129028320312, - "learning_rate": 5.140164245905633e-07, - "loss": 0.3768, - "step": 64080 - }, - { - "epoch": 128.22, - "grad_norm": 45.331077575683594, - "learning_rate": 5.112451170876903e-07, - "loss": 0.3629, - "step": 64110 - }, - { - "epoch": 128.28, - "grad_norm": 65.87416076660156, - "learning_rate": 5.084808979414779e-07, - "loss": 0.4392, - "step": 64140 - }, - { - "epoch": 128.34, - "grad_norm": 50.307708740234375, - "learning_rate": 5.057237715170032e-07, - "loss": 0.3833, - "step": 64170 - }, - { - "epoch": 128.4, - "grad_norm": 51.025508880615234, - "learning_rate": 5.029737421681446e-07, - "loss": 0.2941, - "step": 64200 - }, - { - "epoch": 128.46, - "grad_norm": 6.70941371936351e-05, - "learning_rate": 5.002308142375762e-07, - "loss": 0.3574, - "step": 64230 - }, - { - "epoch": 128.52, - "grad_norm": 39.82708740234375, - "learning_rate": 4.97494992056754e-07, - "loss": 0.4264, - "step": 64260 - }, - { - "epoch": 128.58, - "grad_norm": 50.79159927368164, - "learning_rate": 4.947662799459152e-07, - "loss": 0.4255, - "step": 64290 - }, - { - "epoch": 128.64, - "grad_norm": 51.88654708862305, - "learning_rate": 4.920446822140673e-07, - "loss": 0.361, - "step": 64320 - }, - { - "epoch": 128.7, - "grad_norm": 193.65829467773438, - "learning_rate": 4.893302031589864e-07, - "loss": 0.3327, - "step": 64350 - }, - { - "epoch": 128.76, - "grad_norm": 41.31486511230469, - "learning_rate": 4.866228470672041e-07, - "loss": 0.3462, - "step": 64380 - }, - { - "epoch": 128.82, - "grad_norm": 37.94261169433594, - "learning_rate": 4.839226182140072e-07, - "loss": 0.3831, - "step": 64410 - }, - { - "epoch": 128.88, - "grad_norm": 47.26423263549805, - "learning_rate": 4.812295208634238e-07, - "loss": 0.3016, - "step": 64440 - }, - { - "epoch": 128.94, - "grad_norm": 282.98797607421875, - "learning_rate": 4.78543559268222e-07, - "loss": 0.3769, - "step": 64470 - }, - { - "epoch": 129.0, - "grad_norm": 59.48456954956055, - "learning_rate": 4.758647376699033e-07, - "loss": 0.3488, - "step": 64500 - }, - { - "epoch": 129.0, - "eval_loss": 0.2899148166179657, - "eval_map": 0.7982, - "eval_map_50": 0.9623, - "eval_map_75": 0.8974, - "eval_map_chicken": 0.7821, - "eval_map_duck": 0.7478, - "eval_map_large": 0.8123, - "eval_map_medium": 0.8049, - "eval_map_plant": 0.8647, - "eval_map_small": 0.3311, - "eval_mar_1": 0.3171, - "eval_mar_10": 0.8372, - "eval_mar_100": 0.8432, - "eval_mar_100_chicken": 0.8298, - "eval_mar_100_duck": 0.8, - "eval_mar_100_plant": 0.8997, - "eval_mar_large": 0.8514, - "eval_mar_medium": 0.8481, - "eval_mar_small": 0.4352, - "eval_runtime": 14.298, - "eval_samples_per_second": 6.994, - "eval_steps_per_second": 0.909, - "step": 64500 - }, - { - "epoch": 129.06, - "grad_norm": 71.56198120117188, - "learning_rate": 4.731930602986906e-07, - "loss": 0.3358, - "step": 64530 - }, - { - "epoch": 129.12, - "grad_norm": 25.362306594848633, - "learning_rate": 4.705285313735297e-07, - "loss": 0.3104, - "step": 64560 - }, - { - "epoch": 129.18, - "grad_norm": 51.97401428222656, - "learning_rate": 4.678711551020743e-07, - "loss": 0.3498, - "step": 64590 - }, - { - "epoch": 129.24, - "grad_norm": 72.9772720336914, - "learning_rate": 4.6522093568068307e-07, - "loss": 0.326, - "step": 64620 - }, - { - "epoch": 129.3, - "grad_norm": 0.0001010323321679607, - "learning_rate": 4.625778772944156e-07, - "loss": 0.5324, - "step": 64650 - }, - { - "epoch": 129.36, - "grad_norm": 57.38959503173828, - "learning_rate": 4.599419841170216e-07, - "loss": 0.3524, - "step": 64680 - }, - { - "epoch": 129.42, - "grad_norm": 52.89522933959961, - "learning_rate": 4.5731326031093645e-07, - "loss": 0.4292, - "step": 64710 - }, - { - "epoch": 129.48, - "grad_norm": 63.3166389465332, - "learning_rate": 4.546917100272735e-07, - "loss": 0.3784, - "step": 64740 - }, - { - "epoch": 129.54, - "grad_norm": 70.8720932006836, - "learning_rate": 4.520773374058179e-07, - "loss": 0.3363, - "step": 64770 - }, - { - "epoch": 129.6, - "grad_norm": 49.737701416015625, - "learning_rate": 4.494701465750217e-07, - "loss": 0.3516, - "step": 64800 - }, - { - "epoch": 129.66, - "grad_norm": 43.897071838378906, - "learning_rate": 4.4687014165199547e-07, - "loss": 0.3167, - "step": 64830 - }, - { - "epoch": 129.72, - "grad_norm": 26.70827865600586, - "learning_rate": 4.4427732674250045e-07, - "loss": 0.2829, - "step": 64860 - }, - { - "epoch": 129.78, - "grad_norm": 26.810070037841797, - "learning_rate": 4.416917059409465e-07, - "loss": 0.369, - "step": 64890 - }, - { - "epoch": 129.84, - "grad_norm": 43.5709114074707, - "learning_rate": 4.391132833303807e-07, - "loss": 0.4261, - "step": 64920 - }, - { - "epoch": 129.9, - "grad_norm": 47.29655838012695, - "learning_rate": 4.3654206298248625e-07, - "loss": 0.4163, - "step": 64950 - }, - { - "epoch": 129.96, - "grad_norm": 56.56647491455078, - "learning_rate": 4.3397804895756957e-07, - "loss": 0.2774, - "step": 64980 - }, - { - "epoch": 130.0, - "eval_loss": 0.287985622882843, - "eval_map": 0.7985, - "eval_map_50": 0.9623, - "eval_map_75": 0.8972, - "eval_map_chicken": 0.7842, - "eval_map_duck": 0.7457, - "eval_map_large": 0.8152, - "eval_map_medium": 0.8056, - "eval_map_plant": 0.8656, - "eval_map_small": 0.3337, - "eval_mar_1": 0.3174, - "eval_mar_10": 0.8363, - "eval_mar_100": 0.8424, - "eval_mar_100_chicken": 0.8313, - "eval_mar_100_duck": 0.7959, - "eval_mar_100_plant": 0.9, - "eval_mar_large": 0.8526, - "eval_mar_medium": 0.8472, - "eval_mar_small": 0.4286, - "eval_runtime": 14.6141, - "eval_samples_per_second": 6.843, - "eval_steps_per_second": 0.89, - "step": 65000 - }, - { - "epoch": 130.02, - "grad_norm": 54.62247848510742, - "learning_rate": 4.31421245304558e-07, - "loss": 0.3533, - "step": 65010 - }, - { - "epoch": 130.08, - "grad_norm": 64.50666809082031, - "learning_rate": 4.2887165606099513e-07, - "loss": 0.315, - "step": 65040 - }, - { - "epoch": 130.14, - "grad_norm": 28.4924259185791, - "learning_rate": 4.263292852530293e-07, - "loss": 0.4233, - "step": 65070 - }, - { - "epoch": 130.2, - "grad_norm": 108.92642211914062, - "learning_rate": 4.237941368954124e-07, - "loss": 0.3925, - "step": 65100 - }, - { - "epoch": 130.26, - "grad_norm": 25.28023338317871, - "learning_rate": 4.212662149914887e-07, - "loss": 0.4153, - "step": 65130 - }, - { - "epoch": 130.32, - "grad_norm": 38.81027603149414, - "learning_rate": 4.1874552353319107e-07, - "loss": 0.3781, - "step": 65160 - }, - { - "epoch": 130.38, - "grad_norm": 46.95817565917969, - "learning_rate": 4.162320665010372e-07, - "loss": 0.3524, - "step": 65190 - }, - { - "epoch": 130.44, - "grad_norm": 53.66548156738281, - "learning_rate": 4.137258478641176e-07, - "loss": 0.4081, - "step": 65220 - }, - { - "epoch": 130.5, - "grad_norm": 189.784912109375, - "learning_rate": 4.112268715800943e-07, - "loss": 0.442, - "step": 65250 - }, - { - "epoch": 130.56, - "grad_norm": 36.14055252075195, - "learning_rate": 4.087351415951918e-07, - "loss": 0.3566, - "step": 65280 - }, - { - "epoch": 130.62, - "grad_norm": 44.45828628540039, - "learning_rate": 4.062506618441908e-07, - "loss": 0.3864, - "step": 65310 - }, - { - "epoch": 130.68, - "grad_norm": 75.06278991699219, - "learning_rate": 4.0377343625042587e-07, - "loss": 0.3363, - "step": 65340 - }, - { - "epoch": 130.74, - "grad_norm": 63.461273193359375, - "learning_rate": 4.013034687257727e-07, - "loss": 0.358, - "step": 65370 - }, - { - "epoch": 130.8, - "grad_norm": 0.00011619520228123292, - "learning_rate": 3.9884076317064813e-07, - "loss": 0.4634, - "step": 65400 - }, - { - "epoch": 130.86, - "grad_norm": 51.01006317138672, - "learning_rate": 3.963853234740006e-07, - "loss": 0.3914, - "step": 65430 - }, - { - "epoch": 130.92, - "grad_norm": 38.83234405517578, - "learning_rate": 3.9393715351330243e-07, - "loss": 0.3827, - "step": 65460 - }, - { - "epoch": 130.98, - "grad_norm": 33.826419830322266, - "learning_rate": 3.9149625715455107e-07, - "loss": 0.3268, - "step": 65490 - }, - { - "epoch": 131.0, - "eval_loss": 0.2949516773223877, - "eval_map": 0.7966, - "eval_map_50": 0.9645, - "eval_map_75": 0.904, - "eval_map_chicken": 0.7806, - "eval_map_duck": 0.7465, - "eval_map_large": 0.8135, - "eval_map_medium": 0.8028, - "eval_map_plant": 0.8628, - "eval_map_small": 0.3272, - "eval_mar_1": 0.3162, - "eval_mar_10": 0.836, - "eval_mar_100": 0.8422, - "eval_mar_100_chicken": 0.8294, - "eval_mar_100_duck": 0.799, - "eval_mar_100_plant": 0.8982, - "eval_mar_large": 0.8531, - "eval_mar_medium": 0.8471, - "eval_mar_small": 0.4352, - "eval_runtime": 13.6836, - "eval_samples_per_second": 7.308, - "eval_steps_per_second": 0.95, - "step": 65500 - }, - { - "epoch": 131.04, - "grad_norm": 66.37953186035156, - "learning_rate": 3.890626382522539e-07, - "loss": 0.4373, - "step": 65520 - }, - { - "epoch": 131.1, - "grad_norm": 51.77748107910156, - "learning_rate": 3.866363006494256e-07, - "loss": 0.3255, - "step": 65550 - }, - { - "epoch": 131.16, - "grad_norm": 43.79826354980469, - "learning_rate": 3.8421724817758745e-07, - "loss": 0.326, - "step": 65580 - }, - { - "epoch": 131.22, - "grad_norm": 48.64401626586914, - "learning_rate": 3.818054846567515e-07, - "loss": 0.3303, - "step": 65610 - }, - { - "epoch": 131.28, - "grad_norm": 86.83602142333984, - "learning_rate": 3.794010138954213e-07, - "loss": 0.3713, - "step": 65640 - }, - { - "epoch": 131.34, - "grad_norm": 49.17142105102539, - "learning_rate": 3.770038396905862e-07, - "loss": 0.3325, - "step": 65670 - }, - { - "epoch": 131.4, - "grad_norm": 80.1779556274414, - "learning_rate": 3.7461396582771035e-07, - "loss": 0.3662, - "step": 65700 - }, - { - "epoch": 131.46, - "grad_norm": 41.394718170166016, - "learning_rate": 3.7223139608073e-07, - "loss": 0.3514, - "step": 65730 - }, - { - "epoch": 131.52, - "grad_norm": 36.34390640258789, - "learning_rate": 3.698561342120499e-07, - "loss": 0.4441, - "step": 65760 - }, - { - "epoch": 131.58, - "grad_norm": 101.07977294921875, - "learning_rate": 3.674881839725314e-07, - "loss": 0.3543, - "step": 65790 - }, - { - "epoch": 131.64, - "grad_norm": 63.61982345581055, - "learning_rate": 3.651275491014905e-07, - "loss": 0.4257, - "step": 65820 - }, - { - "epoch": 131.7, - "grad_norm": 0.0002082155697280541, - "learning_rate": 3.627742333266937e-07, - "loss": 0.2849, - "step": 65850 - }, - { - "epoch": 131.76, - "grad_norm": 32.257057189941406, - "learning_rate": 3.604282403643472e-07, - "loss": 0.4016, - "step": 65880 - }, - { - "epoch": 131.82, - "grad_norm": 67.80140686035156, - "learning_rate": 3.5808957391909315e-07, - "loss": 0.2716, - "step": 65910 - }, - { - "epoch": 131.88, - "grad_norm": 57.564090728759766, - "learning_rate": 3.557582376840063e-07, - "loss": 0.4208, - "step": 65940 - }, - { - "epoch": 131.94, - "grad_norm": 43.46548843383789, - "learning_rate": 3.534342353405834e-07, - "loss": 0.3586, - "step": 65970 - }, - { - "epoch": 132.0, - "grad_norm": 58.81836700439453, - "learning_rate": 3.511175705587433e-07, - "loss": 0.327, - "step": 66000 - }, - { - "epoch": 132.0, - "eval_loss": 0.2854064702987671, - "eval_map": 0.8026, - "eval_map_50": 0.9658, - "eval_map_75": 0.8916, - "eval_map_chicken": 0.7927, - "eval_map_duck": 0.7447, - "eval_map_large": 0.8186, - "eval_map_medium": 0.8085, - "eval_map_plant": 0.8704, - "eval_map_small": 0.3174, - "eval_mar_1": 0.3177, - "eval_mar_10": 0.8391, - "eval_mar_100": 0.845, - "eval_mar_100_chicken": 0.8369, - "eval_mar_100_duck": 0.7959, - "eval_mar_100_plant": 0.9021, - "eval_mar_large": 0.8567, - "eval_mar_medium": 0.8497, - "eval_mar_small": 0.4124, - "eval_runtime": 13.7357, - "eval_samples_per_second": 7.28, - "eval_steps_per_second": 0.946, - "step": 66000 - }, - { - "epoch": 132.06, - "grad_norm": 57.28191375732422, - "learning_rate": 3.488082469968146e-07, - "loss": 0.2886, - "step": 66030 - }, - { - "epoch": 132.12, - "grad_norm": 50.39839553833008, - "learning_rate": 3.465062683015341e-07, - "loss": 0.4037, - "step": 66060 - }, - { - "epoch": 132.18, - "grad_norm": 178.81991577148438, - "learning_rate": 3.442116381080418e-07, - "loss": 0.3479, - "step": 66090 - }, - { - "epoch": 132.24, - "grad_norm": 35.48100662231445, - "learning_rate": 3.419243600398703e-07, - "loss": 0.3567, - "step": 66120 - }, - { - "epoch": 132.3, - "grad_norm": 32.5038948059082, - "learning_rate": 3.396444377089453e-07, - "loss": 0.3543, - "step": 66150 - }, - { - "epoch": 132.36, - "grad_norm": 51.1141242980957, - "learning_rate": 3.373718747155752e-07, - "loss": 0.365, - "step": 66180 - }, - { - "epoch": 132.42, - "grad_norm": 59.56440353393555, - "learning_rate": 3.351066746484455e-07, - "loss": 0.3682, - "step": 66210 - }, - { - "epoch": 132.48, - "grad_norm": 190.19277954101562, - "learning_rate": 3.328488410846187e-07, - "loss": 0.4171, - "step": 66240 - }, - { - "epoch": 132.54, - "grad_norm": 20.468778610229492, - "learning_rate": 3.3059837758951995e-07, - "loss": 0.3483, - "step": 66270 - }, - { - "epoch": 132.6, - "grad_norm": 21.8949031829834, - "learning_rate": 3.283552877169399e-07, - "loss": 0.3236, - "step": 66300 - }, - { - "epoch": 132.66, - "grad_norm": 53.96356964111328, - "learning_rate": 3.2611957500902345e-07, - "loss": 0.2952, - "step": 66330 - }, - { - "epoch": 132.72, - "grad_norm": 57.27799606323242, - "learning_rate": 3.2389124299626483e-07, - "loss": 0.3828, - "step": 66360 - }, - { - "epoch": 132.78, - "grad_norm": 40.665035247802734, - "learning_rate": 3.216702951975059e-07, - "loss": 0.3993, - "step": 66390 - }, - { - "epoch": 132.84, - "grad_norm": 113.07135772705078, - "learning_rate": 3.194567351199257e-07, - "loss": 0.3451, - "step": 66420 - }, - { - "epoch": 132.9, - "grad_norm": 52.17920684814453, - "learning_rate": 3.172505662590386e-07, - "loss": 0.375, - "step": 66450 - }, - { - "epoch": 132.96, - "grad_norm": 46.23152160644531, - "learning_rate": 3.150517920986851e-07, - "loss": 0.3712, - "step": 66480 - }, - { - "epoch": 133.0, - "eval_loss": 0.2902440130710602, - "eval_map": 0.8018, - "eval_map_50": 0.9658, - "eval_map_75": 0.8912, - "eval_map_chicken": 0.7912, - "eval_map_duck": 0.7457, - "eval_map_large": 0.8175, - "eval_map_medium": 0.8063, - "eval_map_plant": 0.8686, - "eval_map_small": 0.3277, - "eval_mar_1": 0.3174, - "eval_mar_10": 0.8391, - "eval_mar_100": 0.8449, - "eval_mar_100_chicken": 0.8365, - "eval_mar_100_duck": 0.7969, - "eval_mar_100_plant": 0.9012, - "eval_mar_large": 0.8584, - "eval_mar_medium": 0.8477, - "eval_mar_small": 0.4352, - "eval_runtime": 14.2745, - "eval_samples_per_second": 7.005, - "eval_steps_per_second": 0.911, - "step": 66500 - }, - { - "epoch": 133.02, - "grad_norm": 46.68117904663086, - "learning_rate": 3.128604161110299e-07, - "loss": 0.3958, - "step": 66510 - }, - { - "epoch": 133.08, - "grad_norm": 190.38941955566406, - "learning_rate": 3.106764417565561e-07, - "loss": 0.3325, - "step": 66540 - }, - { - "epoch": 133.14, - "grad_norm": 72.22937774658203, - "learning_rate": 3.08499872484056e-07, - "loss": 0.3495, - "step": 66570 - }, - { - "epoch": 133.2, - "grad_norm": 45.56755447387695, - "learning_rate": 3.0633071173062966e-07, - "loss": 0.3537, - "step": 66600 - }, - { - "epoch": 133.26, - "grad_norm": 45.41728591918945, - "learning_rate": 3.0416896292167873e-07, - "loss": 0.3928, - "step": 66630 - }, - { - "epoch": 133.32, - "grad_norm": 53.52821350097656, - "learning_rate": 3.0201462947089865e-07, - "loss": 0.341, - "step": 66660 - }, - { - "epoch": 133.38, - "grad_norm": 91.77867126464844, - "learning_rate": 2.99867714780277e-07, - "loss": 0.3923, - "step": 66690 - }, - { - "epoch": 133.44, - "grad_norm": 41.08647918701172, - "learning_rate": 2.9772822224008515e-07, - "loss": 0.3136, - "step": 66720 - }, - { - "epoch": 133.5, - "grad_norm": 165.907470703125, - "learning_rate": 2.9559615522887275e-07, - "loss": 0.3472, - "step": 66750 - }, - { - "epoch": 133.56, - "grad_norm": 89.72096252441406, - "learning_rate": 2.9347151711346556e-07, - "loss": 0.4876, - "step": 66780 - }, - { - "epoch": 133.62, - "grad_norm": 65.85697937011719, - "learning_rate": 2.913543112489564e-07, - "loss": 0.3345, - "step": 66810 - }, - { - "epoch": 133.68, - "grad_norm": 58.98741149902344, - "learning_rate": 2.892445409787037e-07, - "loss": 0.3719, - "step": 66840 - }, - { - "epoch": 133.74, - "grad_norm": 66.10700225830078, - "learning_rate": 2.8714220963432125e-07, - "loss": 0.3723, - "step": 66870 - }, - { - "epoch": 133.8, - "grad_norm": 43.45757293701172, - "learning_rate": 2.850473205356774e-07, - "loss": 0.3382, - "step": 66900 - }, - { - "epoch": 133.86, - "grad_norm": 38.253074645996094, - "learning_rate": 2.829598769908892e-07, - "loss": 0.3118, - "step": 66930 - }, - { - "epoch": 133.92, - "grad_norm": 39.28963851928711, - "learning_rate": 2.8087988229631325e-07, - "loss": 0.3559, - "step": 66960 - }, - { - "epoch": 133.98, - "grad_norm": 43.38936233520508, - "learning_rate": 2.788073397365465e-07, - "loss": 0.3267, - "step": 66990 - }, - { - "epoch": 134.0, - "eval_loss": 0.28852832317352295, - "eval_map": 0.8009, - "eval_map_50": 0.964, - "eval_map_75": 0.8987, - "eval_map_chicken": 0.7863, - "eval_map_duck": 0.7468, - "eval_map_large": 0.8133, - "eval_map_medium": 0.8065, - "eval_map_plant": 0.8696, - "eval_map_small": 0.3322, - "eval_mar_1": 0.3167, - "eval_mar_10": 0.8384, - "eval_mar_100": 0.8438, - "eval_mar_100_chicken": 0.8321, - "eval_mar_100_duck": 0.7969, - "eval_mar_100_plant": 0.9024, - "eval_mar_large": 0.8523, - "eval_mar_medium": 0.8484, - "eval_mar_small": 0.4252, - "eval_runtime": 14.4872, - "eval_samples_per_second": 6.903, - "eval_steps_per_second": 0.897, - "step": 67000 - }, - { - "epoch": 134.04, - "grad_norm": 109.6541519165039, - "learning_rate": 2.76742252584416e-07, - "loss": 0.3697, - "step": 67020 - }, - { - "epoch": 134.1, - "grad_norm": 50.6714973449707, - "learning_rate": 2.746846241009765e-07, - "loss": 0.4235, - "step": 67050 - }, - { - "epoch": 134.16, - "grad_norm": 46.14804458618164, - "learning_rate": 2.7263445753550275e-07, - "loss": 0.3751, - "step": 67080 - }, - { - "epoch": 134.22, - "grad_norm": 45.713138580322266, - "learning_rate": 2.7059175612548947e-07, - "loss": 0.3713, - "step": 67110 - }, - { - "epoch": 134.28, - "grad_norm": 36.28562545776367, - "learning_rate": 2.685565230966408e-07, - "loss": 0.2888, - "step": 67140 - }, - { - "epoch": 134.34, - "grad_norm": 36.700775146484375, - "learning_rate": 2.665287616628659e-07, - "loss": 0.3553, - "step": 67170 - }, - { - "epoch": 134.4, - "grad_norm": 44.0689697265625, - "learning_rate": 2.6450847502627883e-07, - "loss": 0.4438, - "step": 67200 - }, - { - "epoch": 134.46, - "grad_norm": 21.92855453491211, - "learning_rate": 2.6249566637718714e-07, - "loss": 0.4085, - "step": 67230 - }, - { - "epoch": 134.52, - "grad_norm": 42.19912338256836, - "learning_rate": 2.604903388940899e-07, - "loss": 0.326, - "step": 67260 - }, - { - "epoch": 134.58, - "grad_norm": 55.26387405395508, - "learning_rate": 2.584924957436735e-07, - "loss": 0.28, - "step": 67290 - }, - { - "epoch": 134.64, - "grad_norm": 48.82943344116211, - "learning_rate": 2.5650214008080544e-07, - "loss": 0.3009, - "step": 67320 - }, - { - "epoch": 134.7, - "grad_norm": 85.5448989868164, - "learning_rate": 2.5451927504852757e-07, - "loss": 0.3113, - "step": 67350 - }, - { - "epoch": 134.76, - "grad_norm": 33.30947494506836, - "learning_rate": 2.525439037780558e-07, - "loss": 0.3877, - "step": 67380 - }, - { - "epoch": 134.82, - "grad_norm": 42.817466735839844, - "learning_rate": 2.505760293887699e-07, - "loss": 0.3209, - "step": 67410 - }, - { - "epoch": 134.88, - "grad_norm": 147.4586639404297, - "learning_rate": 2.486156549882135e-07, - "loss": 0.4274, - "step": 67440 - }, - { - "epoch": 134.94, - "grad_norm": 29.05756187438965, - "learning_rate": 2.4666278367208417e-07, - "loss": 0.3726, - "step": 67470 - }, - { - "epoch": 135.0, - "grad_norm": 70.35362243652344, - "learning_rate": 2.447174185242324e-07, - "loss": 0.4273, - "step": 67500 - }, - { - "epoch": 135.0, - "eval_loss": 0.2911410927772522, - "eval_map": 0.7979, - "eval_map_50": 0.9638, - "eval_map_75": 0.9028, - "eval_map_chicken": 0.7828, - "eval_map_duck": 0.7428, - "eval_map_large": 0.8095, - "eval_map_medium": 0.8033, - "eval_map_plant": 0.8681, - "eval_map_small": 0.3267, - "eval_mar_1": 0.3175, - "eval_mar_10": 0.8352, - "eval_mar_100": 0.8406, - "eval_mar_100_chicken": 0.8298, - "eval_mar_100_duck": 0.7918, - "eval_mar_100_plant": 0.9003, - "eval_mar_large": 0.8494, - "eval_mar_medium": 0.8448, - "eval_mar_small": 0.4205, - "eval_runtime": 13.8699, - "eval_samples_per_second": 7.21, - "eval_steps_per_second": 0.937, - "step": 67500 - }, - { - "epoch": 135.06, - "grad_norm": 42.571895599365234, - "learning_rate": 2.4277956261665624e-07, - "loss": 0.4658, - "step": 67530 - }, - { - "epoch": 135.12, - "grad_norm": 61.84291458129883, - "learning_rate": 2.40849219009493e-07, - "loss": 0.3557, - "step": 67560 - }, - { - "epoch": 135.18, - "grad_norm": 82.146484375, - "learning_rate": 2.389263907510209e-07, - "loss": 0.3332, - "step": 67590 - }, - { - "epoch": 135.24, - "grad_norm": 25.76155662536621, - "learning_rate": 2.3701108087764657e-07, - "loss": 0.3536, - "step": 67620 - }, - { - "epoch": 135.3, - "grad_norm": 106.06716918945312, - "learning_rate": 2.351032924139063e-07, - "loss": 0.3805, - "step": 67650 - }, - { - "epoch": 135.36, - "grad_norm": 64.08528900146484, - "learning_rate": 2.3320302837245846e-07, - "loss": 0.3396, - "step": 67680 - }, - { - "epoch": 135.42, - "grad_norm": 67.47964477539062, - "learning_rate": 2.3131029175407883e-07, - "loss": 0.3214, - "step": 67710 - }, - { - "epoch": 135.48, - "grad_norm": 109.34996795654297, - "learning_rate": 2.2942508554765764e-07, - "loss": 0.3533, - "step": 67740 - }, - { - "epoch": 135.54, - "grad_norm": 73.63320922851562, - "learning_rate": 2.27547412730193e-07, - "loss": 0.3323, - "step": 67770 - }, - { - "epoch": 135.6, - "grad_norm": 31.16606330871582, - "learning_rate": 2.2567727626678527e-07, - "loss": 0.2959, - "step": 67800 - }, - { - "epoch": 135.66, - "grad_norm": 40.19267654418945, - "learning_rate": 2.2381467911063658e-07, - "loss": 0.3962, - "step": 67830 - }, - { - "epoch": 135.72, - "grad_norm": 36.41028594970703, - "learning_rate": 2.2195962420304083e-07, - "loss": 0.3573, - "step": 67860 - }, - { - "epoch": 135.78, - "grad_norm": 48.676414489746094, - "learning_rate": 2.2011211447338477e-07, - "loss": 0.3599, - "step": 67890 - }, - { - "epoch": 135.84, - "grad_norm": 115.03677368164062, - "learning_rate": 2.1827215283913683e-07, - "loss": 0.3128, - "step": 67920 - }, - { - "epoch": 135.9, - "grad_norm": 75.01472473144531, - "learning_rate": 2.1643974220584729e-07, - "loss": 0.4229, - "step": 67950 - }, - { - "epoch": 135.96, - "grad_norm": 78.67342376708984, - "learning_rate": 2.1461488546714425e-07, - "loss": 0.3564, - "step": 67980 - }, - { - "epoch": 136.0, - "eval_loss": 0.2914939522743225, - "eval_map": 0.797, - "eval_map_50": 0.9634, - "eval_map_75": 0.9013, - "eval_map_chicken": 0.7825, - "eval_map_duck": 0.7411, - "eval_map_large": 0.818, - "eval_map_medium": 0.8023, - "eval_map_plant": 0.8674, - "eval_map_small": 0.3325, - "eval_mar_1": 0.3176, - "eval_mar_10": 0.8349, - "eval_mar_100": 0.8406, - "eval_mar_100_chicken": 0.8286, - "eval_mar_100_duck": 0.7918, - "eval_mar_100_plant": 0.9015, - "eval_mar_large": 0.8553, - "eval_mar_medium": 0.8449, - "eval_mar_small": 0.419, - "eval_runtime": 14.7026, - "eval_samples_per_second": 6.802, - "eval_steps_per_second": 0.884, - "step": 68000 - }, - { - "epoch": 136.02, - "grad_norm": 211.8123779296875, - "learning_rate": 2.127975855047243e-07, - "loss": 0.5481, - "step": 68010 - }, - { - "epoch": 136.08, - "grad_norm": 39.24762725830078, - "learning_rate": 2.1098784518835292e-07, - "loss": 0.3468, - "step": 68040 - }, - { - "epoch": 136.14, - "grad_norm": 75.79733276367188, - "learning_rate": 2.0918566737585688e-07, - "loss": 0.3446, - "step": 68070 - }, - { - "epoch": 136.2, - "grad_norm": 162.20359802246094, - "learning_rate": 2.0739105491312028e-07, - "loss": 0.3352, - "step": 68100 - }, - { - "epoch": 136.26, - "grad_norm": 57.89274597167969, - "learning_rate": 2.056040106340823e-07, - "loss": 0.4676, - "step": 68130 - }, - { - "epoch": 136.32, - "grad_norm": 61.71417236328125, - "learning_rate": 2.0382453736072838e-07, - "loss": 0.386, - "step": 68160 - }, - { - "epoch": 136.38, - "grad_norm": 70.39722442626953, - "learning_rate": 2.0205263790309125e-07, - "loss": 0.272, - "step": 68190 - }, - { - "epoch": 136.44, - "grad_norm": 66.32408905029297, - "learning_rate": 2.0028831505924162e-07, - "loss": 0.3302, - "step": 68220 - }, - { - "epoch": 136.5, - "grad_norm": 42.234256744384766, - "learning_rate": 1.9853157161528468e-07, - "loss": 0.3163, - "step": 68250 - }, - { - "epoch": 136.56, - "grad_norm": 72.14662170410156, - "learning_rate": 1.967824103453597e-07, - "loss": 0.3368, - "step": 68280 - }, - { - "epoch": 136.62, - "grad_norm": 44.91769790649414, - "learning_rate": 1.9504083401162999e-07, - "loss": 0.4026, - "step": 68310 - }, - { - "epoch": 136.68, - "grad_norm": 92.38590240478516, - "learning_rate": 1.9330684536428335e-07, - "loss": 0.327, - "step": 68340 - }, - { - "epoch": 136.74, - "grad_norm": 42.71702194213867, - "learning_rate": 1.9158044714152447e-07, - "loss": 0.3716, - "step": 68370 - }, - { - "epoch": 136.8, - "grad_norm": 53.39596939086914, - "learning_rate": 1.8986164206957037e-07, - "loss": 0.3533, - "step": 68400 - }, - { - "epoch": 136.86, - "grad_norm": 32.2762565612793, - "learning_rate": 1.8815043286265044e-07, - "loss": 0.3279, - "step": 68430 - }, - { - "epoch": 136.92, - "grad_norm": 33.744667053222656, - "learning_rate": 1.8644682222299703e-07, - "loss": 0.3219, - "step": 68460 - }, - { - "epoch": 136.98, - "grad_norm": 73.03089141845703, - "learning_rate": 1.8475081284084428e-07, - "loss": 0.358, - "step": 68490 - }, - { - "epoch": 137.0, - "eval_loss": 0.2883448302745819, - "eval_map": 0.8007, - "eval_map_50": 0.9635, - "eval_map_75": 0.9034, - "eval_map_chicken": 0.7868, - "eval_map_duck": 0.7455, - "eval_map_large": 0.8189, - "eval_map_medium": 0.8054, - "eval_map_plant": 0.8698, - "eval_map_small": 0.3399, - "eval_mar_1": 0.3187, - "eval_mar_10": 0.8379, - "eval_mar_100": 0.8434, - "eval_mar_100_chicken": 0.8333, - "eval_mar_100_duck": 0.7948, - "eval_mar_100_plant": 0.9021, - "eval_mar_large": 0.8564, - "eval_mar_medium": 0.8469, - "eval_mar_small": 0.4367, - "eval_runtime": 12.8356, - "eval_samples_per_second": 7.791, - "eval_steps_per_second": 1.013, - "step": 68500 - }, - { - "epoch": 137.04, - "grad_norm": 68.37001037597656, - "learning_rate": 1.8306240739442094e-07, - "loss": 0.3544, - "step": 68520 - }, - { - "epoch": 137.1, - "grad_norm": 29.655811309814453, - "learning_rate": 1.8138160854995145e-07, - "loss": 0.3628, - "step": 68550 - }, - { - "epoch": 137.16, - "grad_norm": 39.01556396484375, - "learning_rate": 1.7970841896164658e-07, - "loss": 0.3693, - "step": 68580 - }, - { - "epoch": 137.22, - "grad_norm": 51.84676742553711, - "learning_rate": 1.7804284127169946e-07, - "loss": 0.3564, - "step": 68610 - }, - { - "epoch": 137.28, - "grad_norm": 37.72648620605469, - "learning_rate": 1.7638487811028616e-07, - "loss": 0.3348, - "step": 68640 - }, - { - "epoch": 137.34, - "grad_norm": 84.99642181396484, - "learning_rate": 1.7473453209555625e-07, - "loss": 0.338, - "step": 68670 - }, - { - "epoch": 137.4, - "grad_norm": 65.15522003173828, - "learning_rate": 1.7309180583363062e-07, - "loss": 0.4385, - "step": 68700 - }, - { - "epoch": 137.46, - "grad_norm": 78.89385986328125, - "learning_rate": 1.7145670191859977e-07, - "loss": 0.3528, - "step": 68730 - }, - { - "epoch": 137.52, - "grad_norm": 71.5306396484375, - "learning_rate": 1.6982922293251548e-07, - "loss": 0.3505, - "step": 68760 - }, - { - "epoch": 137.58, - "grad_norm": 51.439693450927734, - "learning_rate": 1.6820937144538807e-07, - "loss": 0.3758, - "step": 68790 - }, - { - "epoch": 137.64, - "grad_norm": 59.33545684814453, - "learning_rate": 1.6659715001518583e-07, - "loss": 0.3499, - "step": 68820 - }, - { - "epoch": 137.7, - "grad_norm": 41.85493850708008, - "learning_rate": 1.6499256118782503e-07, - "loss": 0.3502, - "step": 68850 - }, - { - "epoch": 137.76, - "grad_norm": 55.376251220703125, - "learning_rate": 1.6339560749717154e-07, - "loss": 0.3846, - "step": 68880 - }, - { - "epoch": 137.82, - "grad_norm": 63.67637634277344, - "learning_rate": 1.6180629146503256e-07, - "loss": 0.392, - "step": 68910 - }, - { - "epoch": 137.88, - "grad_norm": 38.77060317993164, - "learning_rate": 1.6022461560115498e-07, - "loss": 0.4113, - "step": 68940 - }, - { - "epoch": 137.94, - "grad_norm": 39.97504806518555, - "learning_rate": 1.586505824032214e-07, - "loss": 0.3014, - "step": 68970 - }, - { - "epoch": 138.0, - "grad_norm": 121.58015441894531, - "learning_rate": 1.5708419435684463e-07, - "loss": 0.3715, - "step": 69000 - }, - { - "epoch": 138.0, - "eval_loss": 0.2868429720401764, - "eval_map": 0.7973, - "eval_map_50": 0.9632, - "eval_map_75": 0.9007, - "eval_map_chicken": 0.7847, - "eval_map_duck": 0.7397, - "eval_map_large": 0.8125, - "eval_map_medium": 0.8025, - "eval_map_plant": 0.8676, - "eval_map_small": 0.3366, - "eval_mar_1": 0.3172, - "eval_mar_10": 0.8358, - "eval_mar_100": 0.8413, - "eval_mar_100_chicken": 0.8317, - "eval_mar_100_duck": 0.7907, - "eval_mar_100_plant": 0.9015, - "eval_mar_large": 0.8521, - "eval_mar_medium": 0.8446, - "eval_mar_small": 0.4286, - "eval_runtime": 14.578, - "eval_samples_per_second": 6.86, - "eval_steps_per_second": 0.892, - "step": 69000 - }, - { - "epoch": 138.06, - "grad_norm": 67.07673645019531, - "learning_rate": 1.555254539355655e-07, - "loss": 0.3319, - "step": 69030 - }, - { - "epoch": 138.12, - "grad_norm": 101.25053405761719, - "learning_rate": 1.5397436360084784e-07, - "loss": 0.3278, - "step": 69060 - }, - { - "epoch": 138.18, - "grad_norm": 49.164764404296875, - "learning_rate": 1.5243092580207507e-07, - "loss": 0.3755, - "step": 69090 - }, - { - "epoch": 138.24, - "grad_norm": 77.7751693725586, - "learning_rate": 1.5089514297654594e-07, - "loss": 0.3228, - "step": 69120 - }, - { - "epoch": 138.3, - "grad_norm": 55.398651123046875, - "learning_rate": 1.4936701754947104e-07, - "loss": 0.3178, - "step": 69150 - }, - { - "epoch": 138.36, - "grad_norm": 57.23589324951172, - "learning_rate": 1.4784655193396947e-07, - "loss": 0.3482, - "step": 69180 - }, - { - "epoch": 138.42, - "grad_norm": 66.49388122558594, - "learning_rate": 1.463337485310634e-07, - "loss": 0.376, - "step": 69210 - }, - { - "epoch": 138.48, - "grad_norm": 95.41547393798828, - "learning_rate": 1.448286097296764e-07, - "loss": 0.3877, - "step": 69240 - }, - { - "epoch": 138.54, - "grad_norm": 40.57638168334961, - "learning_rate": 1.4333113790662822e-07, - "loss": 0.4282, - "step": 69270 - }, - { - "epoch": 138.6, - "grad_norm": 60.66424560546875, - "learning_rate": 1.4184133542663014e-07, - "loss": 0.3146, - "step": 69300 - }, - { - "epoch": 138.66, - "grad_norm": 54.92922592163086, - "learning_rate": 1.4035920464228525e-07, - "loss": 0.3744, - "step": 69330 - }, - { - "epoch": 138.72, - "grad_norm": 62.56671905517578, - "learning_rate": 1.388847478940797e-07, - "loss": 0.323, - "step": 69360 - }, - { - "epoch": 138.78, - "grad_norm": 38.13356399536133, - "learning_rate": 1.3741796751038095e-07, - "loss": 0.3275, - "step": 69390 - }, - { - "epoch": 138.84, - "grad_norm": 28.64565086364746, - "learning_rate": 1.3595886580743677e-07, - "loss": 0.3618, - "step": 69420 - }, - { - "epoch": 138.9, - "grad_norm": 63.989463806152344, - "learning_rate": 1.3450744508936687e-07, - "loss": 0.3898, - "step": 69450 - }, - { - "epoch": 138.96, - "grad_norm": 169.14093017578125, - "learning_rate": 1.330637076481639e-07, - "loss": 0.4042, - "step": 69480 - }, - { - "epoch": 139.0, - "eval_loss": 0.28515276312828064, - "eval_map": 0.8022, - "eval_map_50": 0.9636, - "eval_map_75": 0.903, - "eval_map_chicken": 0.7864, - "eval_map_duck": 0.7506, - "eval_map_large": 0.8131, - "eval_map_medium": 0.8065, - "eval_map_plant": 0.8695, - "eval_map_small": 0.341, - "eval_mar_1": 0.3187, - "eval_mar_10": 0.84, - "eval_mar_100": 0.8453, - "eval_mar_100_chicken": 0.8333, - "eval_mar_100_duck": 0.801, - "eval_mar_100_plant": 0.9015, - "eval_mar_large": 0.853, - "eval_mar_medium": 0.849, - "eval_mar_small": 0.4381, - "eval_runtime": 14.6737, - "eval_samples_per_second": 6.815, - "eval_steps_per_second": 0.886, - "step": 69500 - }, - { - "epoch": 139.02, - "grad_norm": 32.88087844848633, - "learning_rate": 1.3162765576368587e-07, - "loss": 0.3129, - "step": 69510 - }, - { - "epoch": 139.08, - "grad_norm": 31.760162353515625, - "learning_rate": 1.3019929170365376e-07, - "loss": 0.4039, - "step": 69540 - }, - { - "epoch": 139.14, - "grad_norm": 91.92324829101562, - "learning_rate": 1.287786177236511e-07, - "loss": 0.2552, - "step": 69570 - }, - { - "epoch": 139.2, - "grad_norm": 34.206764221191406, - "learning_rate": 1.2736563606711384e-07, - "loss": 0.4044, - "step": 69600 - }, - { - "epoch": 139.26, - "grad_norm": 104.41314697265625, - "learning_rate": 1.259603489653355e-07, - "loss": 0.4223, - "step": 69630 - }, - { - "epoch": 139.32, - "grad_norm": 57.35292053222656, - "learning_rate": 1.2456275863745426e-07, - "loss": 0.3795, - "step": 69660 - }, - { - "epoch": 139.38, - "grad_norm": 80.43934631347656, - "learning_rate": 1.2317286729045586e-07, - "loss": 0.3923, - "step": 69690 - }, - { - "epoch": 139.44, - "grad_norm": 87.62979125976562, - "learning_rate": 1.2179067711917015e-07, - "loss": 0.4593, - "step": 69720 - }, - { - "epoch": 139.5, - "grad_norm": 43.982688903808594, - "learning_rate": 1.2041619030626283e-07, - "loss": 0.338, - "step": 69750 - }, - { - "epoch": 139.56, - "grad_norm": 54.61286926269531, - "learning_rate": 1.1904940902223661e-07, - "loss": 0.3105, - "step": 69780 - }, - { - "epoch": 139.62, - "grad_norm": 119.23469543457031, - "learning_rate": 1.1769033542542552e-07, - "loss": 0.3612, - "step": 69810 - }, - { - "epoch": 139.68, - "grad_norm": 46.48311996459961, - "learning_rate": 1.1633897166199227e-07, - "loss": 0.3571, - "step": 69840 - }, - { - "epoch": 139.74, - "grad_norm": 207.8822784423828, - "learning_rate": 1.1499531986592482e-07, - "loss": 0.3269, - "step": 69870 - }, - { - "epoch": 139.8, - "grad_norm": 341.46990966796875, - "learning_rate": 1.136593821590326e-07, - "loss": 0.4198, - "step": 69900 - }, - { - "epoch": 139.86, - "grad_norm": 28.238218307495117, - "learning_rate": 1.1233116065094363e-07, - "loss": 0.3042, - "step": 69930 - }, - { - "epoch": 139.92, - "grad_norm": 40.68604278564453, - "learning_rate": 1.1101065743910122e-07, - "loss": 0.5129, - "step": 69960 - }, - { - "epoch": 139.98, - "grad_norm": 45.59909439086914, - "learning_rate": 1.0969787460876013e-07, - "loss": 0.3881, - "step": 69990 - }, - { - "epoch": 140.0, - "eval_loss": 0.28711405396461487, - "eval_map": 0.8016, - "eval_map_50": 0.9632, - "eval_map_75": 0.8966, - "eval_map_chicken": 0.7864, - "eval_map_duck": 0.7496, - "eval_map_large": 0.8174, - "eval_map_medium": 0.8064, - "eval_map_plant": 0.8687, - "eval_map_small": 0.3441, - "eval_mar_1": 0.3176, - "eval_mar_10": 0.8384, - "eval_mar_100": 0.8437, - "eval_mar_100_chicken": 0.831, - "eval_mar_100_duck": 0.799, - "eval_mar_100_plant": 0.9012, - "eval_mar_large": 0.8561, - "eval_mar_medium": 0.8472, - "eval_mar_small": 0.4348, - "eval_runtime": 13.3807, - "eval_samples_per_second": 7.473, - "eval_steps_per_second": 0.972, - "step": 70000 - }, - { - "epoch": 140.04, - "grad_norm": 49.717437744140625, - "learning_rate": 1.0839281423298375e-07, - "loss": 0.4085, - "step": 70020 - }, - { - "epoch": 140.1, - "grad_norm": 77.0780258178711, - "learning_rate": 1.0709547837263967e-07, - "loss": 0.294, - "step": 70050 - }, - { - "epoch": 140.16, - "grad_norm": 52.57013702392578, - "learning_rate": 1.0580586907639912e-07, - "loss": 0.3965, - "step": 70080 - }, - { - "epoch": 140.22, - "grad_norm": 36.34819793701172, - "learning_rate": 1.0452398838073141e-07, - "loss": 0.4028, - "step": 70110 - }, - { - "epoch": 140.28, - "grad_norm": 114.36404418945312, - "learning_rate": 1.032498383099001e-07, - "loss": 0.3522, - "step": 70140 - }, - { - "epoch": 140.34, - "grad_norm": 61.337974548339844, - "learning_rate": 1.0198342087596292e-07, - "loss": 0.3825, - "step": 70170 - }, - { - "epoch": 140.4, - "grad_norm": 25.393247604370117, - "learning_rate": 1.007247380787657e-07, - "loss": 0.3265, - "step": 70200 - }, - { - "epoch": 140.46, - "grad_norm": 84.1668930053711, - "learning_rate": 9.947379190594076e-08, - "loss": 0.2991, - "step": 70230 - }, - { - "epoch": 140.52, - "grad_norm": 38.32514572143555, - "learning_rate": 9.823058433290178e-08, - "loss": 0.3119, - "step": 70260 - }, - { - "epoch": 140.58, - "grad_norm": 63.19240951538086, - "learning_rate": 9.699511732284395e-08, - "loss": 0.5792, - "step": 70290 - }, - { - "epoch": 140.64, - "grad_norm": 8.30960925668478e-05, - "learning_rate": 9.576739282673886e-08, - "loss": 0.3746, - "step": 70320 - }, - { - "epoch": 140.7, - "grad_norm": 63.64250183105469, - "learning_rate": 9.454741278333013e-08, - "loss": 0.3033, - "step": 70350 - }, - { - "epoch": 140.76, - "grad_norm": 49.97964859008789, - "learning_rate": 9.333517911913281e-08, - "loss": 0.3494, - "step": 70380 - }, - { - "epoch": 140.82, - "grad_norm": 85.51181030273438, - "learning_rate": 9.213069374842953e-08, - "loss": 0.3608, - "step": 70410 - }, - { - "epoch": 140.88, - "grad_norm": 99.78071594238281, - "learning_rate": 9.093395857326714e-08, - "loss": 0.3545, - "step": 70440 - }, - { - "epoch": 140.94, - "grad_norm": 27.587324142456055, - "learning_rate": 8.974497548345396e-08, - "loss": 0.3373, - "step": 70470 - }, - { - "epoch": 141.0, - "grad_norm": 114.62167358398438, - "learning_rate": 8.856374635655696e-08, - "loss": 0.3214, - "step": 70500 - }, - { - "epoch": 141.0, - "eval_loss": 0.28778883814811707, - "eval_map": 0.798, - "eval_map_50": 0.9632, - "eval_map_75": 0.8974, - "eval_map_chicken": 0.7844, - "eval_map_duck": 0.7425, - "eval_map_large": 0.8145, - "eval_map_medium": 0.8015, - "eval_map_plant": 0.8671, - "eval_map_small": 0.3421, - "eval_mar_1": 0.316, - "eval_mar_10": 0.8372, - "eval_mar_100": 0.8423, - "eval_mar_100_chicken": 0.8306, - "eval_mar_100_duck": 0.7969, - "eval_mar_100_plant": 0.8994, - "eval_mar_large": 0.8547, - "eval_mar_medium": 0.8449, - "eval_mar_small": 0.4381, - "eval_runtime": 13.9156, - "eval_samples_per_second": 7.186, - "eval_steps_per_second": 0.934, - "step": 70500 - }, - { - "epoch": 141.06, - "grad_norm": 0.0002042367705143988, - "learning_rate": 8.739027305789682e-08, - "loss": 0.3125, - "step": 70530 - }, - { - "epoch": 141.12, - "grad_norm": 30.428842544555664, - "learning_rate": 8.622455744054958e-08, - "loss": 0.4564, - "step": 70560 - }, - { - "epoch": 141.18, - "grad_norm": 139.28721618652344, - "learning_rate": 8.506660134533828e-08, - "loss": 0.3745, - "step": 70590 - }, - { - "epoch": 141.24, - "grad_norm": 46.43798065185547, - "learning_rate": 8.391640660083411e-08, - "loss": 0.3477, - "step": 70620 - }, - { - "epoch": 141.3, - "grad_norm": 88.65122985839844, - "learning_rate": 8.277397502335194e-08, - "loss": 0.3021, - "step": 70650 - }, - { - "epoch": 141.36, - "grad_norm": 21.00395965576172, - "learning_rate": 8.163930841694589e-08, - "loss": 0.3501, - "step": 70680 - }, - { - "epoch": 141.42, - "grad_norm": 37.91747283935547, - "learning_rate": 8.051240857341102e-08, - "loss": 0.4402, - "step": 70710 - }, - { - "epoch": 141.48, - "grad_norm": 30.93425941467285, - "learning_rate": 7.939327727227441e-08, - "loss": 0.3929, - "step": 70740 - }, - { - "epoch": 141.54, - "grad_norm": 80.28870391845703, - "learning_rate": 7.828191628079851e-08, - "loss": 0.291, - "step": 70770 - }, - { - "epoch": 141.6, - "grad_norm": 93.69755554199219, - "learning_rate": 7.717832735397335e-08, - "loss": 0.3465, - "step": 70800 - }, - { - "epoch": 141.66, - "grad_norm": 89.86848449707031, - "learning_rate": 7.608251223451601e-08, - "loss": 0.3483, - "step": 70830 - }, - { - "epoch": 141.72, - "grad_norm": 75.96288299560547, - "learning_rate": 7.499447265286952e-08, - "loss": 0.389, - "step": 70860 - }, - { - "epoch": 141.78, - "grad_norm": 54.10462951660156, - "learning_rate": 7.39142103271956e-08, - "loss": 0.3949, - "step": 70890 - }, - { - "epoch": 141.84, - "grad_norm": 55.18855285644531, - "learning_rate": 7.284172696337688e-08, - "loss": 0.4104, - "step": 70920 - }, - { - "epoch": 141.9, - "grad_norm": 49.38865661621094, - "learning_rate": 7.177702425500977e-08, - "loss": 0.3755, - "step": 70950 - }, - { - "epoch": 141.96, - "grad_norm": 215.8840789794922, - "learning_rate": 7.072010388340656e-08, - "loss": 0.3357, - "step": 70980 - }, - { - "epoch": 142.0, - "eval_loss": 0.2879177927970886, - "eval_map": 0.7978, - "eval_map_50": 0.9639, - "eval_map_75": 0.8906, - "eval_map_chicken": 0.7829, - "eval_map_duck": 0.7456, - "eval_map_large": 0.8151, - "eval_map_medium": 0.8026, - "eval_map_plant": 0.865, - "eval_map_small": 0.342, - "eval_mar_1": 0.3163, - "eval_mar_10": 0.8364, - "eval_mar_100": 0.8416, - "eval_mar_100_chicken": 0.8278, - "eval_mar_100_duck": 0.7969, - "eval_mar_100_plant": 0.9, - "eval_mar_large": 0.8546, - "eval_mar_medium": 0.8452, - "eval_mar_small": 0.4348, - "eval_runtime": 13.5425, - "eval_samples_per_second": 7.384, - "eval_steps_per_second": 0.96, - "step": 71000 - }, - { - "epoch": 142.02, - "grad_norm": 43.489471435546875, - "learning_rate": 6.967096751758773e-08, - "loss": 0.4084, - "step": 71010 - }, - { - "epoch": 142.08, - "grad_norm": 116.61605072021484, - "learning_rate": 6.862961681428304e-08, - "loss": 0.2909, - "step": 71040 - }, - { - "epoch": 142.14, - "grad_norm": 74.62935638427734, - "learning_rate": 6.759605341792819e-08, - "loss": 0.3646, - "step": 71070 - }, - { - "epoch": 142.2, - "grad_norm": 78.06919860839844, - "learning_rate": 6.657027896065982e-08, - "loss": 0.3274, - "step": 71100 - }, - { - "epoch": 142.26, - "grad_norm": 145.50811767578125, - "learning_rate": 6.555229506231608e-08, - "loss": 0.3553, - "step": 71130 - }, - { - "epoch": 142.32, - "grad_norm": 86.26103973388672, - "learning_rate": 6.454210333043275e-08, - "loss": 0.4501, - "step": 71160 - }, - { - "epoch": 142.38, - "grad_norm": 156.82568359375, - "learning_rate": 6.353970536024045e-08, - "loss": 0.333, - "step": 71190 - }, - { - "epoch": 142.44, - "grad_norm": 103.7710952758789, - "learning_rate": 6.254510273466186e-08, - "loss": 0.3599, - "step": 71220 - }, - { - "epoch": 142.5, - "grad_norm": 61.770416259765625, - "learning_rate": 6.15582970243117e-08, - "loss": 0.345, - "step": 71250 - }, - { - "epoch": 142.56, - "grad_norm": 41.92399215698242, - "learning_rate": 6.057928978748906e-08, - "loss": 0.3872, - "step": 71280 - }, - { - "epoch": 142.62, - "grad_norm": 0.0001438482286175713, - "learning_rate": 5.960808257018113e-08, - "loss": 0.2993, - "step": 71310 - }, - { - "epoch": 142.68, - "grad_norm": 116.0578842163086, - "learning_rate": 5.864467690605613e-08, - "loss": 0.3742, - "step": 71340 - }, - { - "epoch": 142.74, - "grad_norm": 63.14453125, - "learning_rate": 5.76890743164632e-08, - "loss": 0.3473, - "step": 71370 - }, - { - "epoch": 142.8, - "grad_norm": 137.06199645996094, - "learning_rate": 5.674127631043025e-08, - "loss": 0.4043, - "step": 71400 - }, - { - "epoch": 142.86, - "grad_norm": 46.13239669799805, - "learning_rate": 5.580128438465837e-08, - "loss": 0.3086, - "step": 71430 - }, - { - "epoch": 142.92, - "grad_norm": 43.08638000488281, - "learning_rate": 5.4869100023523526e-08, - "loss": 0.3117, - "step": 71460 - }, - { - "epoch": 142.98, - "grad_norm": 87.1728286743164, - "learning_rate": 5.394472469907208e-08, - "loss": 0.302, - "step": 71490 - }, - { - "epoch": 143.0, - "eval_loss": 0.2861666977405548, - "eval_map": 0.8007, - "eval_map_50": 0.9638, - "eval_map_75": 0.8928, - "eval_map_chicken": 0.7869, - "eval_map_duck": 0.7467, - "eval_map_large": 0.8169, - "eval_map_medium": 0.8046, - "eval_map_plant": 0.8684, - "eval_map_small": 0.3448, - "eval_mar_1": 0.317, - "eval_mar_10": 0.8381, - "eval_mar_100": 0.8434, - "eval_mar_100_chicken": 0.831, - "eval_mar_100_duck": 0.7979, - "eval_mar_100_plant": 0.9012, - "eval_mar_large": 0.856, - "eval_mar_medium": 0.8472, - "eval_mar_small": 0.4348, - "eval_runtime": 13.8396, - "eval_samples_per_second": 7.226, - "eval_steps_per_second": 0.939, - "step": 71500 - }, - { - "epoch": 143.04, - "grad_norm": 69.2220687866211, - "learning_rate": 5.302815987101917e-08, - "loss": 0.4492, - "step": 71520 - }, - { - "epoch": 143.1, - "grad_norm": 33.27827835083008, - "learning_rate": 5.2119406986745336e-08, - "loss": 0.3843, - "step": 71550 - }, - { - "epoch": 143.16, - "grad_norm": 54.40850830078125, - "learning_rate": 5.121846748129544e-08, - "loss": 0.3944, - "step": 71580 - }, - { - "epoch": 143.22, - "grad_norm": 205.82879638671875, - "learning_rate": 5.032534277737644e-08, - "loss": 0.5238, - "step": 71610 - }, - { - "epoch": 143.28, - "grad_norm": 41.09965515136719, - "learning_rate": 4.944003428535349e-08, - "loss": 0.3828, - "step": 71640 - }, - { - "epoch": 143.34, - "grad_norm": 61.372779846191406, - "learning_rate": 4.856254340325051e-08, - "loss": 0.301, - "step": 71670 - }, - { - "epoch": 143.4, - "grad_norm": 86.27459716796875, - "learning_rate": 4.769287151674407e-08, - "loss": 0.3022, - "step": 71700 - }, - { - "epoch": 143.46, - "grad_norm": 38.24869918823242, - "learning_rate": 4.683101999916562e-08, - "loss": 0.361, - "step": 71730 - }, - { - "epoch": 143.52, - "grad_norm": 88.84414672851562, - "learning_rate": 4.597699021149649e-08, - "loss": 0.3642, - "step": 71760 - }, - { - "epoch": 143.58, - "grad_norm": 49.37421417236328, - "learning_rate": 4.5130783502365106e-08, - "loss": 0.3567, - "step": 71790 - }, - { - "epoch": 143.64, - "grad_norm": 53.82075500488281, - "learning_rate": 4.429240120804923e-08, - "loss": 0.4042, - "step": 71820 - }, - { - "epoch": 143.7, - "grad_norm": 43.972496032714844, - "learning_rate": 4.346184465246761e-08, - "loss": 0.347, - "step": 71850 - }, - { - "epoch": 143.76, - "grad_norm": 25.60863494873047, - "learning_rate": 4.263911514718222e-08, - "loss": 0.3437, - "step": 71880 - }, - { - "epoch": 143.82, - "grad_norm": 63.7047233581543, - "learning_rate": 4.1824213991396024e-08, - "loss": 0.3654, - "step": 71910 - }, - { - "epoch": 143.88, - "grad_norm": 32.8650016784668, - "learning_rate": 4.10171424719491e-08, - "loss": 0.3382, - "step": 71940 - }, - { - "epoch": 143.94, - "grad_norm": 91.05632019042969, - "learning_rate": 4.0217901863317534e-08, - "loss": 0.2996, - "step": 71970 - }, - { - "epoch": 144.0, - "grad_norm": 51.264190673828125, - "learning_rate": 3.9426493427611177e-08, - "loss": 0.3504, - "step": 72000 - }, - { - "epoch": 144.0, - "eval_loss": 0.2855512499809265, - "eval_map": 0.801, - "eval_map_50": 0.9638, - "eval_map_75": 0.8912, - "eval_map_chicken": 0.7856, - "eval_map_duck": 0.7486, - "eval_map_large": 0.8199, - "eval_map_medium": 0.8055, - "eval_map_plant": 0.8689, - "eval_map_small": 0.3394, - "eval_mar_1": 0.3177, - "eval_mar_10": 0.8392, - "eval_mar_100": 0.8445, - "eval_mar_100_chicken": 0.831, - "eval_mar_100_duck": 0.801, - "eval_mar_100_plant": 0.9015, - "eval_mar_large": 0.8576, - "eval_mar_medium": 0.8476, - "eval_mar_small": 0.4381, - "eval_runtime": 12.9118, - "eval_samples_per_second": 7.745, - "eval_steps_per_second": 1.007, - "step": 72000 - }, - { - "epoch": 144.06, - "grad_norm": 9.316276555182412e-05, - "learning_rate": 3.864291841457146e-08, - "loss": 0.3186, - "step": 72030 - }, - { - "epoch": 144.12, - "grad_norm": 78.5443344116211, - "learning_rate": 3.786717806157136e-08, - "loss": 0.3513, - "step": 72060 - }, - { - "epoch": 144.18, - "grad_norm": 114.05219268798828, - "learning_rate": 3.7099273593609316e-08, - "loss": 0.3342, - "step": 72090 - }, - { - "epoch": 144.24, - "grad_norm": 47.46656799316406, - "learning_rate": 3.633920622331311e-08, - "loss": 0.3796, - "step": 72120 - }, - { - "epoch": 144.3, - "grad_norm": 57.45075988769531, - "learning_rate": 3.558697715093207e-08, - "loss": 0.3123, - "step": 72150 - }, - { - "epoch": 144.36, - "grad_norm": 65.71527862548828, - "learning_rate": 3.4842587564337674e-08, - "loss": 0.3707, - "step": 72180 - }, - { - "epoch": 144.42, - "grad_norm": 9.118278831010684e-05, - "learning_rate": 3.410603863902406e-08, - "loss": 0.3521, - "step": 72210 - }, - { - "epoch": 144.48, - "grad_norm": 27.67734718322754, - "learning_rate": 3.337733153810141e-08, - "loss": 0.3518, - "step": 72240 - }, - { - "epoch": 144.54, - "grad_norm": 294.27203369140625, - "learning_rate": 3.2656467412298665e-08, - "loss": 0.2792, - "step": 72270 - }, - { - "epoch": 144.6, - "grad_norm": 41.44548797607422, - "learning_rate": 3.194344739995803e-08, - "loss": 0.3097, - "step": 72300 - }, - { - "epoch": 144.66, - "grad_norm": 36.42474365234375, - "learning_rate": 3.1238272627035494e-08, - "loss": 0.3046, - "step": 72330 - }, - { - "epoch": 144.72, - "grad_norm": 52.03242492675781, - "learning_rate": 3.054094420709863e-08, - "loss": 0.4278, - "step": 72360 - }, - { - "epoch": 144.78, - "grad_norm": 98.86956787109375, - "learning_rate": 2.985146324132438e-08, - "loss": 0.3682, - "step": 72390 - }, - { - "epoch": 144.84, - "grad_norm": 36.63032150268555, - "learning_rate": 2.9169830818496226e-08, - "loss": 0.377, - "step": 72420 - }, - { - "epoch": 144.9, - "grad_norm": 38.923377990722656, - "learning_rate": 2.8496048015005385e-08, - "loss": 0.3451, - "step": 72450 - }, - { - "epoch": 144.96, - "grad_norm": 75.13690948486328, - "learning_rate": 2.783011589484741e-08, - "loss": 0.3533, - "step": 72480 - }, - { - "epoch": 145.0, - "eval_loss": 0.2862549126148224, - "eval_map": 0.7992, - "eval_map_50": 0.9637, - "eval_map_75": 0.8912, - "eval_map_chicken": 0.7858, - "eval_map_duck": 0.7443, - "eval_map_large": 0.8154, - "eval_map_medium": 0.8055, - "eval_map_plant": 0.8676, - "eval_map_small": 0.3428, - "eval_mar_1": 0.3162, - "eval_mar_10": 0.8378, - "eval_mar_100": 0.8431, - "eval_mar_100_chicken": 0.831, - "eval_mar_100_duck": 0.7969, - "eval_mar_100_plant": 0.9015, - "eval_mar_large": 0.8551, - "eval_mar_medium": 0.8467, - "eval_mar_small": 0.4381, - "eval_runtime": 14.2646, - "eval_samples_per_second": 7.01, - "eval_steps_per_second": 0.911, - "step": 72500 - }, - { - "epoch": 145.02, - "grad_norm": 42.16242218017578, - "learning_rate": 2.7172035509619442e-08, - "loss": 0.3196, - "step": 72510 - }, - { - "epoch": 145.08, - "grad_norm": 77.00399780273438, - "learning_rate": 2.6521807898520214e-08, - "loss": 0.39, - "step": 72540 - }, - { - "epoch": 145.14, - "grad_norm": 90.41899108886719, - "learning_rate": 2.5879434088348364e-08, - "loss": 0.3079, - "step": 72570 - }, - { - "epoch": 145.2, - "grad_norm": 64.04692840576172, - "learning_rate": 2.5244915093499134e-08, - "loss": 0.3786, - "step": 72600 - }, - { - "epoch": 145.26, - "grad_norm": 75.01786804199219, - "learning_rate": 2.46182519159649e-08, - "loss": 0.4118, - "step": 72630 - }, - { - "epoch": 145.32, - "grad_norm": 36.48422622680664, - "learning_rate": 2.3999445545332955e-08, - "loss": 0.324, - "step": 72660 - }, - { - "epoch": 145.38, - "grad_norm": 31.995967864990234, - "learning_rate": 2.3388496958782203e-08, - "loss": 0.4274, - "step": 72690 - }, - { - "epoch": 145.44, - "grad_norm": 57.6303596496582, - "learning_rate": 2.2785407121084236e-08, - "loss": 0.3504, - "step": 72720 - }, - { - "epoch": 145.5, - "grad_norm": 38.874210357666016, - "learning_rate": 2.219017698460002e-08, - "loss": 0.53, - "step": 72750 - }, - { - "epoch": 145.56, - "grad_norm": 96.02101135253906, - "learning_rate": 2.1602807489279344e-08, - "loss": 0.3378, - "step": 72780 - }, - { - "epoch": 145.62, - "grad_norm": 114.84069061279297, - "learning_rate": 2.1023299562658584e-08, - "loss": 0.3171, - "step": 72810 - }, - { - "epoch": 145.68, - "grad_norm": 45.43848419189453, - "learning_rate": 2.0451654119860164e-08, - "loss": 0.3684, - "step": 72840 - }, - { - "epoch": 145.74, - "grad_norm": 65.03713989257812, - "learning_rate": 1.988787206359033e-08, - "loss": 0.3478, - "step": 72870 - }, - { - "epoch": 145.8, - "grad_norm": 0.00011910265311598778, - "learning_rate": 1.9331954284137476e-08, - "loss": 0.4666, - "step": 72900 - }, - { - "epoch": 145.86, - "grad_norm": 89.89669036865234, - "learning_rate": 1.8783901659372162e-08, - "loss": 0.4239, - "step": 72930 - }, - { - "epoch": 145.92, - "grad_norm": 90.59011840820312, - "learning_rate": 1.8243715054744315e-08, - "loss": 0.2945, - "step": 72960 - }, - { - "epoch": 145.98, - "grad_norm": 60.71207046508789, - "learning_rate": 1.7711395323281588e-08, - "loss": 0.3648, - "step": 72990 - }, - { - "epoch": 146.0, - "eval_loss": 0.28614741563796997, - "eval_map": 0.7987, - "eval_map_50": 0.9638, - "eval_map_75": 0.8913, - "eval_map_chicken": 0.7855, - "eval_map_duck": 0.7435, - "eval_map_large": 0.8153, - "eval_map_medium": 0.8047, - "eval_map_plant": 0.8672, - "eval_map_small": 0.3428, - "eval_mar_1": 0.3162, - "eval_mar_10": 0.8375, - "eval_mar_100": 0.8427, - "eval_mar_100_chicken": 0.831, - "eval_mar_100_duck": 0.7959, - "eval_mar_100_plant": 0.9012, - "eval_mar_large": 0.855, - "eval_mar_medium": 0.8463, - "eval_mar_small": 0.4381, - "eval_runtime": 12.7332, - "eval_samples_per_second": 7.853, - "eval_steps_per_second": 1.021, - "step": 73000 - }, - { - "epoch": 146.04, - "grad_norm": 76.41630554199219, - "learning_rate": 1.71869433055899e-08, - "loss": 0.4107, - "step": 73020 - }, - { - "epoch": 146.1, - "grad_norm": 32.97012710571289, - "learning_rate": 1.6670359829850657e-08, - "loss": 0.3645, - "step": 73050 - }, - { - "epoch": 146.16, - "grad_norm": 38.913429260253906, - "learning_rate": 1.6161645711819664e-08, - "loss": 0.2932, - "step": 73080 - }, - { - "epoch": 146.22, - "grad_norm": 60.343109130859375, - "learning_rate": 1.5660801754825983e-08, - "loss": 0.3342, - "step": 73110 - }, - { - "epoch": 146.28, - "grad_norm": 30.96074104309082, - "learning_rate": 1.5167828749770853e-08, - "loss": 0.3951, - "step": 73140 - }, - { - "epoch": 146.34, - "grad_norm": 81.41180419921875, - "learning_rate": 1.4682727475124891e-08, - "loss": 0.3341, - "step": 73170 - }, - { - "epoch": 146.4, - "grad_norm": 67.92564392089844, - "learning_rate": 1.4205498696930332e-08, - "loss": 0.2725, - "step": 73200 - }, - { - "epoch": 146.46, - "grad_norm": 8.548750338377431e-05, - "learning_rate": 1.3736143168796012e-08, - "loss": 0.3013, - "step": 73230 - }, - { - "epoch": 146.52, - "grad_norm": 81.73196411132812, - "learning_rate": 1.3274661631899055e-08, - "loss": 0.3924, - "step": 73260 - }, - { - "epoch": 146.58, - "grad_norm": 63.2492790222168, - "learning_rate": 1.2821054814980971e-08, - "loss": 0.4332, - "step": 73290 - }, - { - "epoch": 146.64, - "grad_norm": 40.29335021972656, - "learning_rate": 1.2375323434348773e-08, - "loss": 0.3949, - "step": 73320 - }, - { - "epoch": 146.7, - "grad_norm": 39.234066009521484, - "learning_rate": 1.1937468193873869e-08, - "loss": 0.3329, - "step": 73350 - }, - { - "epoch": 146.76, - "grad_norm": 42.852909088134766, - "learning_rate": 1.1507489784989278e-08, - "loss": 0.3865, - "step": 73380 - }, - { - "epoch": 146.82, - "grad_norm": 85.6583480834961, - "learning_rate": 1.1085388886689085e-08, - "loss": 0.3746, - "step": 73410 - }, - { - "epoch": 146.88, - "grad_norm": 68.23209381103516, - "learning_rate": 1.067116616552899e-08, - "loss": 0.2994, - "step": 73440 - }, - { - "epoch": 146.94, - "grad_norm": 43.73384475708008, - "learning_rate": 1.026482227562242e-08, - "loss": 0.3301, - "step": 73470 - }, - { - "epoch": 147.0, - "grad_norm": 66.02935791015625, - "learning_rate": 9.866357858642206e-09, - "loss": 0.3381, - "step": 73500 - }, - { - "epoch": 147.0, - "eval_loss": 0.2866884768009186, - "eval_map": 0.7996, - "eval_map_50": 0.9637, - "eval_map_75": 0.899, - "eval_map_chicken": 0.7846, - "eval_map_duck": 0.747, - "eval_map_large": 0.8153, - "eval_map_medium": 0.8053, - "eval_map_plant": 0.8672, - "eval_map_small": 0.3428, - "eval_mar_1": 0.3163, - "eval_mar_10": 0.8379, - "eval_mar_100": 0.8431, - "eval_mar_100_chicken": 0.8302, - "eval_mar_100_duck": 0.7979, - "eval_mar_100_plant": 0.9012, - "eval_mar_large": 0.8551, - "eval_mar_medium": 0.8464, - "eval_mar_small": 0.4381, - "eval_runtime": 13.1415, - "eval_samples_per_second": 7.609, - "eval_steps_per_second": 0.989, - "step": 73500 - }, - { - "epoch": 147.06, - "grad_norm": 43.25006103515625, - "learning_rate": 9.475773543818345e-09, - "loss": 0.3582, - "step": 73530 - }, - { - "epoch": 147.12, - "grad_norm": 121.3498306274414, - "learning_rate": 9.09306994793635e-09, - "loss": 0.3283, - "step": 73560 - }, - { - "epoch": 147.18, - "grad_norm": 90.53949737548828, - "learning_rate": 8.718247675337243e-09, - "loss": 0.3048, - "step": 73590 - }, - { - "epoch": 147.24, - "grad_norm": 49.60541915893555, - "learning_rate": 8.351307317917002e-09, - "loss": 0.3482, - "step": 73620 - }, - { - "epoch": 147.3, - "grad_norm": 43.89070129394531, - "learning_rate": 7.992249455124889e-09, - "loss": 0.3535, - "step": 73650 - }, - { - "epoch": 147.36, - "grad_norm": 46.422210693359375, - "learning_rate": 7.641074653961244e-09, - "loss": 0.3618, - "step": 73680 - }, - { - "epoch": 147.42, - "grad_norm": 72.29833221435547, - "learning_rate": 7.297783468980246e-09, - "loss": 0.3872, - "step": 73710 - }, - { - "epoch": 147.48, - "grad_norm": 80.47969818115234, - "learning_rate": 6.962376442284368e-09, - "loss": 0.3651, - "step": 73740 - }, - { - "epoch": 147.54, - "grad_norm": 26.379911422729492, - "learning_rate": 6.63485410352771e-09, - "loss": 0.3639, - "step": 73770 - }, - { - "epoch": 147.6, - "grad_norm": 76.38525390625, - "learning_rate": 6.315216969912663e-09, - "loss": 0.3108, - "step": 73800 - }, - { - "epoch": 147.66, - "grad_norm": 71.98011016845703, - "learning_rate": 6.003465546189358e-09, - "loss": 0.387, - "step": 73830 - }, - { - "epoch": 147.72, - "grad_norm": 34.25730895996094, - "learning_rate": 5.699600324657328e-09, - "loss": 0.3608, - "step": 73860 - }, - { - "epoch": 147.78, - "grad_norm": 68.7569351196289, - "learning_rate": 5.403621785159407e-09, - "loss": 0.3832, - "step": 73890 - }, - { - "epoch": 147.84, - "grad_norm": 44.0081787109375, - "learning_rate": 5.115530395087276e-09, - "loss": 0.3973, - "step": 73920 - }, - { - "epoch": 147.9, - "grad_norm": 36.869285583496094, - "learning_rate": 4.835326609376468e-09, - "loss": 0.3676, - "step": 73950 - }, - { - "epoch": 147.96, - "grad_norm": 36.048248291015625, - "learning_rate": 4.5630108705063684e-09, - "loss": 0.3483, - "step": 73980 - }, - { - "epoch": 148.0, - "eval_loss": 0.28642600774765015, - "eval_map": 0.7995, - "eval_map_50": 0.9637, - "eval_map_75": 0.8989, - "eval_map_chicken": 0.7833, - "eval_map_duck": 0.748, - "eval_map_large": 0.8153, - "eval_map_medium": 0.8055, - "eval_map_plant": 0.8672, - "eval_map_small": 0.3457, - "eval_mar_1": 0.3165, - "eval_mar_10": 0.8381, - "eval_mar_100": 0.8433, - "eval_mar_100_chicken": 0.8298, - "eval_mar_100_duck": 0.799, - "eval_mar_100_plant": 0.9012, - "eval_mar_large": 0.8551, - "eval_mar_medium": 0.8467, - "eval_mar_small": 0.4381, - "eval_runtime": 13.1492, - "eval_samples_per_second": 7.605, - "eval_steps_per_second": 0.989, - "step": 74000 - }, - { - "epoch": 148.02, - "grad_norm": 91.10087585449219, - "learning_rate": 4.298583608501328e-09, - "loss": 0.3597, - "step": 74010 - }, - { - "epoch": 148.08, - "grad_norm": 36.6383056640625, - "learning_rate": 4.042045240927883e-09, - "loss": 0.3727, - "step": 74040 - }, - { - "epoch": 148.14, - "grad_norm": 58.12496566772461, - "learning_rate": 3.793396172895314e-09, - "loss": 0.3224, - "step": 74070 - }, - { - "epoch": 148.2, - "grad_norm": 49.23323440551758, - "learning_rate": 3.5526367970539765e-09, - "loss": 0.3254, - "step": 74100 - }, - { - "epoch": 148.26, - "grad_norm": 31.846426010131836, - "learning_rate": 3.31976749359586e-09, - "loss": 0.4167, - "step": 74130 - }, - { - "epoch": 148.32, - "grad_norm": 54.62555694580078, - "learning_rate": 3.094788630254031e-09, - "loss": 0.3653, - "step": 74160 - }, - { - "epoch": 148.38, - "grad_norm": 46.62826156616211, - "learning_rate": 2.8777005622998567e-09, - "loss": 0.3153, - "step": 74190 - }, - { - "epoch": 148.44, - "grad_norm": 70.24339294433594, - "learning_rate": 2.6685036325457826e-09, - "loss": 0.3971, - "step": 74220 - }, - { - "epoch": 148.5, - "grad_norm": 158.49122619628906, - "learning_rate": 2.4671981713420003e-09, - "loss": 0.4025, - "step": 74250 - }, - { - "epoch": 148.56, - "grad_norm": 62.34785461425781, - "learning_rate": 2.2737844965775578e-09, - "loss": 0.3126, - "step": 74280 - }, - { - "epoch": 148.62, - "grad_norm": 226.48269653320312, - "learning_rate": 2.088262913679251e-09, - "loss": 0.337, - "step": 74310 - }, - { - "epoch": 148.68, - "grad_norm": 81.87285614013672, - "learning_rate": 1.9106337156099553e-09, - "loss": 0.3815, - "step": 74340 - }, - { - "epoch": 148.74, - "grad_norm": 57.122100830078125, - "learning_rate": 1.740897182871404e-09, - "loss": 0.4246, - "step": 74370 - }, - { - "epoch": 148.8, - "grad_norm": 56.535484313964844, - "learning_rate": 1.5790535835003006e-09, - "loss": 0.4102, - "step": 74400 - }, - { - "epoch": 148.86, - "grad_norm": 40.1457405090332, - "learning_rate": 1.425103173069986e-09, - "loss": 0.3297, - "step": 74430 - }, - { - "epoch": 148.92, - "grad_norm": 95.99275207519531, - "learning_rate": 1.2790461946887712e-09, - "loss": 0.2953, - "step": 74460 - }, - { - "epoch": 148.98, - "grad_norm": 57.88656234741211, - "learning_rate": 1.1408828790010484e-09, - "loss": 0.3674, - "step": 74490 - }, - { - "epoch": 149.0, - "eval_loss": 0.2863713502883911, - "eval_map": 0.7992, - "eval_map_50": 0.9637, - "eval_map_75": 0.8989, - "eval_map_chicken": 0.7833, - "eval_map_duck": 0.747, - "eval_map_large": 0.8153, - "eval_map_medium": 0.8051, - "eval_map_plant": 0.8672, - "eval_map_small": 0.3428, - "eval_mar_1": 0.3162, - "eval_mar_10": 0.8378, - "eval_mar_100": 0.843, - "eval_mar_100_chicken": 0.8298, - "eval_mar_100_duck": 0.7979, - "eval_mar_100_plant": 0.9012, - "eval_mar_large": 0.8551, - "eval_mar_medium": 0.8463, - "eval_mar_small": 0.4381, - "eval_runtime": 14.0272, - "eval_samples_per_second": 7.129, - "eval_steps_per_second": 0.927, - "step": 74500 } ], "logging_steps": 30, @@ -21281,7 +10008,7 @@ "attributes": {} } }, - "total_flos": 2.56297219117056e+19, + "total_flos": 1.2040808951808e+19, "train_batch_size": 2, "trial_name": null, "trial_params": null