{ "best_metric": 3.5358800888061523, "best_model_checkpoint": "/mnt/output/projects/sca-xiaoke-v3/amlt-results/7300886566.81622-380c5407-4540-4a74-b6ec-7def0683f098/checkpoint-185000", "epoch": 82.67879288962381, "global_step": 200000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "_prepare_inputs_in_ms": 10.839506983757019, "compute_loss_in_ms": 1584.6049636602402, "epoch": 0.0, "learning_rate/full": 0.0, "loss": 8.622, "step": 1, "training_step_in_ms": 2253.9908327162266 }, { "epoch": 0.0, "eval_visual_genome-densecap-local-densecap-test_loss": 8.927019119262695, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.023580759441051608, "eval_visual_genome-densecap-local-densecap-test_runtime": 150.659, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 5.31, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.166, "step": 1 }, { "_prepare_inputs_in_ms": 4.052688444062369, "compute_loss_in_ms": 266.6276198354092, "epoch": 0.41, "learning_rate/full": 0.0003999851506717227, "loss": 4.9777, "step": 1000, "training_step_in_ms": 963.7469428184035 }, { "_prepare_inputs_in_ms": 4.001575957983732, "compute_loss_in_ms": 266.9940203540027, "epoch": 0.83, "learning_rate/full": 0.0003999221107895784, "loss": 4.4794, "step": 2000, "training_step_in_ms": 964.067553780973 }, { "_prepare_inputs_in_ms": 4.017723824828863, "compute_loss_in_ms": 266.8530354350805, "epoch": 1.24, "learning_rate/full": 0.0003998096443163716, "loss": 4.3589, "step": 3000, "training_step_in_ms": 964.8137692287564 }, { "_prepare_inputs_in_ms": 3.9884973876178265, "compute_loss_in_ms": 266.8117158599198, "epoch": 1.65, "learning_rate/full": 0.0003996477790571026, "loss": 4.2668, "step": 4000, "training_step_in_ms": 963.3689811453223 }, { "_prepare_inputs_in_ms": 4.001692395657301, "compute_loss_in_ms": 267.8194024413824, "epoch": 2.07, "learning_rate/full": 0.0003994365550295963, "loss": 4.2092, "step": 5000, "training_step_in_ms": 965.0005767121911 }, { "epoch": 2.07, "eval_visual_genome-densecap-local-densecap-test_loss": 4.066258430480957, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.19624665436714503, "eval_visual_genome-densecap-local-densecap-test_runtime": 81.5743, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 9.807, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.306, "step": 5000 }, { "_prepare_inputs_in_ms": 4.123009167066434, "compute_loss_in_ms": 267.90184961631894, "epoch": 2.48, "learning_rate/full": 0.0003991760244546079, "loss": 4.1535, "step": 6000, "training_step_in_ms": 963.1004312746227 }, { "_prepare_inputs_in_ms": 4.096908804029226, "compute_loss_in_ms": 268.2109449021518, "epoch": 2.89, "learning_rate/full": 0.00039886625174291286, "loss": 4.1103, "step": 7000, "training_step_in_ms": 965.0139690972865 }, { "_prepare_inputs_in_ms": 4.150357250124216, "compute_loss_in_ms": 269.2836431860924, "epoch": 3.31, "learning_rate/full": 0.0003985073134793826, "loss": 4.0761, "step": 8000, "training_step_in_ms": 969.6529387235641 }, { "_prepare_inputs_in_ms": 4.171766873449087, "compute_loss_in_ms": 268.9554896838963, "epoch": 3.72, "learning_rate/full": 0.00039809973090042857, "loss": 4.0582, "step": 9000, "training_step_in_ms": 964.8072783201933 }, { "_prepare_inputs_in_ms": 4.219205696135759, "compute_loss_in_ms": 268.6923326961696, "epoch": 4.13, "learning_rate/full": 0.00039764327017710485, "loss": 4.0324, "step": 10000, "training_step_in_ms": 962.4501793310046 }, { "epoch": 4.13, "eval_visual_genome-densecap-local-densecap-test_loss": 3.913562059402466, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.22121572228147113, "eval_visual_genome-densecap-local-densecap-test_runtime": 79.9476, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.007, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.313, "step": 10000 }, { "_prepare_inputs_in_ms": 4.152017308444512, "compute_loss_in_ms": 268.094536613673, "epoch": 4.55, "learning_rate/full": 0.0003971380439342646, "loss": 4.0153, "step": 11000, "training_step_in_ms": 964.2485933154821 }, { "_prepare_inputs_in_ms": 4.1431227289140224, "compute_loss_in_ms": 268.42261432111263, "epoch": 4.96, "learning_rate/full": 0.00039658359808291836, "loss": 4.0053, "step": 12000, "training_step_in_ms": 965.7689935192466 }, { "_prepare_inputs_in_ms": 4.223931197077036, "compute_loss_in_ms": 268.6585740670562, "epoch": 5.37, "learning_rate/full": 0.00039598117829320827, "loss": 3.9802, "step": 13000, "training_step_in_ms": 960.5111146196723 }, { "_prepare_inputs_in_ms": 4.1840940825641155, "compute_loss_in_ms": 268.2862157560885, "epoch": 5.79, "learning_rate/full": 0.00039533040308028367, "loss": 3.9633, "step": 14000, "training_step_in_ms": 968.1838200092316 }, { "_prepare_inputs_in_ms": 4.200506843626499, "compute_loss_in_ms": 268.91191502287984, "epoch": 6.2, "learning_rate/full": 0.0003946307092543998, "loss": 3.941, "step": 15000, "training_step_in_ms": 968.3050900287926 }, { "epoch": 6.2, "eval_visual_genome-densecap-local-densecap-test_loss": 3.8218424320220947, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2321593168121597, "eval_visual_genome-densecap-local-densecap-test_runtime": 78.2057, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.229, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.32, "step": 15000 }, { "_prepare_inputs_in_ms": 4.21836834491753, "compute_loss_in_ms": 268.7001321054995, "epoch": 6.61, "learning_rate/full": 0.0003938844405523341, "loss": 3.9323, "step": 16000, "training_step_in_ms": 984.531311199069 }, { "_prepare_inputs_in_ms": 4.2030105367302895, "compute_loss_in_ms": 268.3060254715383, "epoch": 7.03, "learning_rate/full": 0.00039308879047835453, "loss": 3.9216, "step": 17000, "training_step_in_ms": 961.8699175454676 }, { "_prepare_inputs_in_ms": 4.2327940091490746, "compute_loss_in_ms": 269.27323868498206, "epoch": 7.44, "learning_rate/full": 0.00039224627037346294, "loss": 3.8992, "step": 18000, "training_step_in_ms": 967.632270719856 }, { "_prepare_inputs_in_ms": 4.229459121823311, "compute_loss_in_ms": 268.5666101500392, "epoch": 7.85, "learning_rate/full": 0.00039135631637799936, "loss": 3.8984, "step": 19000, "training_step_in_ms": 963.238344412297 }, { "_prepare_inputs_in_ms": 4.240339521318674, "compute_loss_in_ms": 268.11582005023956, "epoch": 8.27, "learning_rate/full": 0.00039041818639024787, "loss": 3.8907, "step": 20000, "training_step_in_ms": 960.5583217255771 }, { "epoch": 8.27, "eval_visual_genome-densecap-local-densecap-test_loss": 3.7651355266571045, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2403944760451539, "eval_visual_genome-densecap-local-densecap-test_runtime": 80.0701, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 9.991, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.312, "step": 20000 }, { "_prepare_inputs_in_ms": 4.2025597829644274, "compute_loss_in_ms": 267.9062583371997, "epoch": 8.68, "learning_rate/full": 0.00038943398810118026, "loss": 3.8736, "step": 21000, "training_step_in_ms": 962.8509967587888 }, { "_prepare_inputs_in_ms": 4.1947984509170055, "compute_loss_in_ms": 268.05593667179346, "epoch": 9.09, "learning_rate/full": 0.00038840304981011036, "loss": 3.8689, "step": 22000, "training_step_in_ms": 965.0497910194099 }, { "_prepare_inputs_in_ms": 4.219467684626579, "compute_loss_in_ms": 268.2473221644759, "epoch": 9.51, "learning_rate/full": 0.0003873256258856351, "loss": 3.8553, "step": 23000, "training_step_in_ms": 967.3452698886395 }, { "_prepare_inputs_in_ms": 4.203684389591217, "compute_loss_in_ms": 268.0240872502327, "epoch": 9.92, "learning_rate/full": 0.00038620312995292836, "loss": 3.8464, "step": 24000, "training_step_in_ms": 960.33872378245 }, { "_prepare_inputs_in_ms": 4.218942817300558, "compute_loss_in_ms": 268.9947931431234, "epoch": 10.33, "learning_rate/full": 0.0003850323958934377, "loss": 3.8356, "step": 25000, "training_step_in_ms": 967.6199573352933 }, { "epoch": 10.33, "eval_visual_genome-densecap-local-densecap-test_loss": 3.71928071975708, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.24336343080593542, "eval_visual_genome-densecap-local-densecap-test_runtime": 79.8751, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.016, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.313, "step": 25000 }, { "_prepare_inputs_in_ms": 4.202740984718974, "compute_loss_in_ms": 268.5807599723339, "epoch": 10.75, "learning_rate/full": 0.0003838183948306088, "loss": 3.8328, "step": 26000, "training_step_in_ms": 961.2188336364925 }, { "_prepare_inputs_in_ms": 4.2269067615270615, "compute_loss_in_ms": 267.7264535538852, "epoch": 11.16, "learning_rate/full": 0.00038255656126572534, "loss": 3.8214, "step": 27000, "training_step_in_ms": 960.6881345175207 }, { "_prepare_inputs_in_ms": 4.240487921983004, "compute_loss_in_ms": 268.31112349405885, "epoch": 11.58, "learning_rate/full": 0.00038125092378570903, "loss": 3.8196, "step": 28000, "training_step_in_ms": 964.0034716315567 }, { "_prepare_inputs_in_ms": 4.273211572319269, "compute_loss_in_ms": 268.9577633589506, "epoch": 11.99, "learning_rate/full": 0.0003798991913473777, "loss": 3.8171, "step": 29000, "training_step_in_ms": 973.0124748162925 }, { "_prepare_inputs_in_ms": 4.244079362601042, "compute_loss_in_ms": 267.9022591896355, "epoch": 12.4, "learning_rate/full": 0.0003785058191464291, "loss": 3.8013, "step": 30000, "training_step_in_ms": 962.8623519428074 }, { "epoch": 12.4, "eval_visual_genome-densecap-local-densecap-test_loss": 3.687087297439575, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.24789182257436765, "eval_visual_genome-densecap-local-densecap-test_runtime": 78.5068, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.19, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.318, "step": 30000 }, { "_prepare_inputs_in_ms": 4.183955312502094, "compute_loss_in_ms": 267.3523456119001, "epoch": 12.82, "learning_rate/full": 0.00037706702930065926, "loss": 3.8065, "step": 31000, "training_step_in_ms": 957.8949020504951 }, { "_prepare_inputs_in_ms": 4.198232229799032, "compute_loss_in_ms": 267.4514962993562, "epoch": 13.23, "learning_rate/full": 0.0003755830450857345, "loss": 3.7986, "step": 32000, "training_step_in_ms": 963.8669461458921 }, { "_prepare_inputs_in_ms": 4.18659433722496, "compute_loss_in_ms": 268.10614936053753, "epoch": 13.64, "learning_rate/full": 0.0003740572005600189, "loss": 3.7923, "step": 33000, "training_step_in_ms": 965.2572022378445 }, { "_prepare_inputs_in_ms": 4.225778687745333, "compute_loss_in_ms": 268.18950264155865, "epoch": 14.06, "learning_rate/full": 0.00037248681827609586, "loss": 3.7947, "step": 34000, "training_step_in_ms": 960.6446040645242 }, { "_prepare_inputs_in_ms": 4.189065434038639, "compute_loss_in_ms": 267.6565695255995, "epoch": 14.47, "learning_rate/full": 0.00037087542640234865, "loss": 3.7849, "step": 35000, "training_step_in_ms": 964.44107465446 }, { "epoch": 14.47, "eval_visual_genome-densecap-local-densecap-test_loss": 3.6763927936553955, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.246958162767791, "eval_visual_genome-densecap-local-densecap-test_runtime": 77.6323, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.305, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.322, "step": 35000 }, { "_prepare_inputs_in_ms": 4.164576116131573, "compute_loss_in_ms": 267.3913585655391, "epoch": 14.88, "learning_rate/full": 0.0003692218735740006, "loss": 3.7838, "step": 36000, "training_step_in_ms": 965.0988348089159 }, { "_prepare_inputs_in_ms": 4.195226285606623, "compute_loss_in_ms": 268.244338080287, "epoch": 15.3, "learning_rate/full": 0.00036752484999829976, "loss": 3.7779, "step": 37000, "training_step_in_ms": 966.1850301101804 }, { "_prepare_inputs_in_ms": 4.189992021769285, "compute_loss_in_ms": 267.8583819307387, "epoch": 15.71, "learning_rate/full": 0.0003657881683678541, "loss": 3.7748, "step": 38000, "training_step_in_ms": 963.9664278812706 }, { "_prepare_inputs_in_ms": 4.199680101126432, "compute_loss_in_ms": 268.06280748173594, "epoch": 16.12, "learning_rate/full": 0.00036401058098760525, "loss": 3.7695, "step": 39000, "training_step_in_ms": 967.5451415590942 }, { "_prepare_inputs_in_ms": 4.182811006903648, "compute_loss_in_ms": 267.7034317664802, "epoch": 16.54, "learning_rate/full": 0.00036219252645064074, "loss": 3.7688, "step": 40000, "training_step_in_ms": 967.6426770947874 }, { "epoch": 16.54, "eval_visual_genome-densecap-local-densecap-test_loss": 3.658348321914673, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.25104865208221006, "eval_visual_genome-densecap-local-densecap-test_runtime": 77.4516, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.329, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.323, "step": 40000 }, { "_prepare_inputs_in_ms": 4.188235598366435, "compute_loss_in_ms": 267.2028581239283, "epoch": 16.95, "learning_rate/full": 0.0003603344533347134, "loss": 3.761, "step": 41000, "training_step_in_ms": 958.9369925446808 }, { "_prepare_inputs_in_ms": 4.214274771511555, "compute_loss_in_ms": 267.64739087969065, "epoch": 17.36, "learning_rate/full": 0.00035843490089475537, "loss": 3.7527, "step": 42000, "training_step_in_ms": 966.9140360169113 }, { "_prepare_inputs_in_ms": 4.22203628346324, "compute_loss_in_ms": 268.2027486599982, "epoch": 17.78, "learning_rate/full": 0.00035650009493379324, "loss": 3.7569, "step": 43000, "training_step_in_ms": 965.1608090028167 }, { "_prepare_inputs_in_ms": 4.219520688056946, "compute_loss_in_ms": 268.0517144687474, "epoch": 18.19, "learning_rate/full": 0.00035452275921920933, "loss": 3.7513, "step": 44000, "training_step_in_ms": 965.6609862968326 }, { "_prepare_inputs_in_ms": 4.1790814362466335, "compute_loss_in_ms": 267.46442713588476, "epoch": 18.6, "learning_rate/full": 0.0003525092554160055, "loss": 3.7467, "step": 45000, "training_step_in_ms": 965.7583395838737 }, { "epoch": 18.6, "eval_visual_genome-densecap-local-densecap-test_loss": 3.6469690799713135, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.25092950859358, "eval_visual_genome-densecap-local-densecap-test_runtime": 78.5468, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.185, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.318, "step": 45000 }, { "_prepare_inputs_in_ms": 4.220321690890847, "compute_loss_in_ms": 267.56717593222857, "epoch": 19.02, "learning_rate/full": 0.0003504601940692656, "loss": 3.7497, "step": 46000, "training_step_in_ms": 964.2354487106204 }, { "_prepare_inputs_in_ms": 4.205725617706776, "compute_loss_in_ms": 268.48560455814004, "epoch": 19.43, "learning_rate/full": 0.0003483698657658315, "loss": 3.7388, "step": 47000, "training_step_in_ms": 967.1772802136838 }, { "_prepare_inputs_in_ms": 4.253620557487011, "compute_loss_in_ms": 267.8220782019198, "epoch": 19.84, "learning_rate/full": 0.0003462450012513184, "loss": 3.744, "step": 48000, "training_step_in_ms": 962.239847779274 }, { "_prepare_inputs_in_ms": 4.241022698581219, "compute_loss_in_ms": 268.39736769348383, "epoch": 20.26, "learning_rate/full": 0.00034408405297105753, "loss": 3.7372, "step": 49000, "training_step_in_ms": 966.1254425011575 }, { "_prepare_inputs_in_ms": 4.21300457790494, "compute_loss_in_ms": 268.7097208276391, "epoch": 20.67, "learning_rate/full": 0.0003418853377786221, "loss": 3.7334, "step": 50000, "training_step_in_ms": 968.8591329194605 }, { "epoch": 20.67, "eval_visual_genome-densecap-local-densecap-test_loss": 3.632450580596924, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.253658040934189, "eval_visual_genome-densecap-local-densecap-test_runtime": 77.9084, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.268, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.321, "step": 50000 }, { "_prepare_inputs_in_ms": 4.228368219805927, "compute_loss_in_ms": 268.4243040457368, "epoch": 21.08, "learning_rate/full": 0.0003396560466114797, "loss": 3.7438, "step": 51000, "training_step_in_ms": 964.8838895820081 }, { "_prepare_inputs_in_ms": 4.233973186463118, "compute_loss_in_ms": 268.22105176746845, "epoch": 21.5, "learning_rate/full": 0.0003373900810764743, "loss": 3.728, "step": 52000, "training_step_in_ms": 962.5837270207703 }, { "_prepare_inputs_in_ms": 4.230040587484837, "compute_loss_in_ms": 267.9561189264059, "epoch": 21.91, "learning_rate/full": 0.0003350878976336386, "loss": 3.7287, "step": 53000, "training_step_in_ms": 964.1780665256083 }, { "_prepare_inputs_in_ms": 4.2476331405341625, "compute_loss_in_ms": 268.6795903816819, "epoch": 22.32, "learning_rate/full": 0.0003327546685845955, "loss": 3.7223, "step": 54000, "training_step_in_ms": 967.9701336547732 }, { "_prepare_inputs_in_ms": 4.220093585550785, "compute_loss_in_ms": 267.76603213325143, "epoch": 22.74, "learning_rate/full": 0.00033038868430752995, "loss": 3.7261, "step": 55000, "training_step_in_ms": 962.9226383566856 }, { "epoch": 22.74, "eval_visual_genome-densecap-local-densecap-test_loss": 3.6242456436157227, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.25521777862203787, "eval_visual_genome-densecap-local-densecap-test_runtime": 78.5774, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.181, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.318, "step": 55000 }, { "_prepare_inputs_in_ms": 4.227604019205745, "compute_loss_in_ms": 267.647510971874, "epoch": 23.15, "learning_rate/full": 0.00032799052857365924, "loss": 3.7232, "step": 56000, "training_step_in_ms": 963.1331409327686 }, { "_prepare_inputs_in_ms": 4.1824629083275795, "compute_loss_in_ms": 267.5452450104058, "epoch": 23.56, "learning_rate/full": 0.0003255583453025672, "loss": 3.7153, "step": 57000, "training_step_in_ms": 965.8048706538975 }, { "_prepare_inputs_in_ms": 4.190924048423767, "compute_loss_in_ms": 268.4611966535449, "epoch": 23.98, "learning_rate/full": 0.0003230975988657048, "loss": 3.72, "step": 58000, "training_step_in_ms": 965.0302759557962 }, { "_prepare_inputs_in_ms": 4.20093110203743, "compute_loss_in_ms": 267.884086355567, "epoch": 24.39, "learning_rate/full": 0.0003206064799382713, "loss": 3.7127, "step": 59000, "training_step_in_ms": 964.0987507812679 }, { "_prepare_inputs_in_ms": 4.210771672427654, "compute_loss_in_ms": 267.6700286902487, "epoch": 24.8, "learning_rate/full": 0.00031808560316658635, "loss": 3.7115, "step": 60000, "training_step_in_ms": 965.6994955539703 }, { "epoch": 24.8, "eval_visual_genome-densecap-local-densecap-test_loss": 3.61262583732605, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.259026039077661, "eval_visual_genome-densecap-local-densecap-test_runtime": 77.8405, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.277, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.321, "step": 60000 }, { "_prepare_inputs_in_ms": 4.141795973225338, "compute_loss_in_ms": 267.2422932982445, "epoch": 25.22, "learning_rate/full": 0.0003155330235866319, "loss": 3.7085, "step": 61000, "training_step_in_ms": 965.9709356427193 }, { "_prepare_inputs_in_ms": 4.12061008810997, "compute_loss_in_ms": 268.04699283093214, "epoch": 25.63, "learning_rate/full": 0.000312954476063518, "loss": 3.7031, "step": 62000, "training_step_in_ms": 964.8432326950133 }, { "_prepare_inputs_in_ms": 4.14773878082633, "compute_loss_in_ms": 268.0800936706364, "epoch": 26.04, "learning_rate/full": 0.00031035068146119334, "loss": 3.7053, "step": 63000, "training_step_in_ms": 964.9066540151834 }, { "_prepare_inputs_in_ms": 4.157721221446991, "compute_loss_in_ms": 267.8991154767573, "epoch": 26.46, "learning_rate/full": 0.00030771441463138695, "loss": 3.6991, "step": 64000, "training_step_in_ms": 966.7548437044024 }, { "_prepare_inputs_in_ms": 4.127573002129793, "compute_loss_in_ms": 268.0769842043519, "epoch": 26.87, "learning_rate/full": 0.00030505419362911944, "loss": 3.7026, "step": 65000, "training_step_in_ms": 966.6518254801631 }, { "epoch": 26.87, "eval_visual_genome-densecap-local-densecap-test_loss": 3.604250907897949, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2600293381296915, "eval_visual_genome-densecap-local-densecap-test_runtime": 77.2046, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.362, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.324, "step": 65000 }, { "_prepare_inputs_in_ms": 4.138722216210714, "compute_loss_in_ms": 268.0730670392513, "epoch": 27.28, "learning_rate/full": 0.0003023653504808654, "loss": 3.6903, "step": 66000, "training_step_in_ms": 965.3969647027552 }, { "_prepare_inputs_in_ms": 4.153087247163057, "compute_loss_in_ms": 268.1363028138876, "epoch": 27.7, "learning_rate/full": 0.0002996566527388639, "loss": 3.6969, "step": 67000, "training_step_in_ms": 965.2745163962245 }, { "_prepare_inputs_in_ms": 4.149796262383461, "compute_loss_in_ms": 267.83912086486816, "epoch": 28.11, "learning_rate/full": 0.0002969179137925403, "loss": 3.6937, "step": 68000, "training_step_in_ms": 968.0436515249312 }, { "_prepare_inputs_in_ms": 4.1318743117153645, "compute_loss_in_ms": 268.5812944062054, "epoch": 28.52, "learning_rate/full": 0.0002941579883457959, "loss": 3.6891, "step": 69000, "training_step_in_ms": 964.7220857255161 }, { "_prepare_inputs_in_ms": 4.13500452041626, "compute_loss_in_ms": 267.81502260267735, "epoch": 28.94, "learning_rate/full": 0.0002913748308243434, "loss": 3.6864, "step": 70000, "training_step_in_ms": 964.9831298328936 }, { "epoch": 28.94, "eval_visual_genome-densecap-local-densecap-test_loss": 3.5996363162994385, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.26106738202465474, "eval_visual_genome-densecap-local-densecap-test_runtime": 79.1905, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.102, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.316, "step": 70000 }, { "_prepare_inputs_in_ms": 4.127892008641871, "compute_loss_in_ms": 267.3319378942251, "epoch": 29.35, "learning_rate/full": 0.000288569127930656, "loss": 3.6864, "step": 71000, "training_step_in_ms": 964.4970440678298 }, { "_prepare_inputs_in_ms": 4.127237547188997, "compute_loss_in_ms": 267.12262638285756, "epoch": 29.76, "learning_rate/full": 0.0002857387308278068, "loss": 3.688, "step": 72000, "training_step_in_ms": 963.8779099695385 }, { "_prepare_inputs_in_ms": 4.134644038975239, "compute_loss_in_ms": 268.62900394946337, "epoch": 30.18, "learning_rate/full": 0.0002828899985518552, "loss": 3.6777, "step": 73000, "training_step_in_ms": 966.1114624030888 }, { "_prepare_inputs_in_ms": 4.121612053364515, "compute_loss_in_ms": 267.61186150833964, "epoch": 30.59, "learning_rate/full": 0.00028002081440907064, "loss": 3.6805, "step": 74000, "training_step_in_ms": 966.5145794674754 }, { "_prepare_inputs_in_ms": 4.143208879977465, "compute_loss_in_ms": 268.1201763525605, "epoch": 31.0, "learning_rate/full": 0.00027713188632770775, "loss": 3.6879, "step": 75000, "training_step_in_ms": 965.0215070433915 }, { "epoch": 31.0, "eval_visual_genome-densecap-local-densecap-test_loss": 3.5912275314331055, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.26092454356630995, "eval_visual_genome-densecap-local-densecap-test_runtime": 78.6905, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.166, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.318, "step": 75000 }, { "_prepare_inputs_in_ms": 4.137767382511279, "compute_loss_in_ms": 267.779229991138, "epoch": 31.42, "learning_rate/full": 0.00027422684725453034, "loss": 3.6725, "step": 76000, "training_step_in_ms": 963.9590919055045 }, { "_prepare_inputs_in_ms": 4.138436369597912, "compute_loss_in_ms": 268.5314156524837, "epoch": 31.83, "learning_rate/full": 0.0002712976542440004, "loss": 3.6758, "step": 77000, "training_step_in_ms": 964.5805881880224 }, { "_prepare_inputs_in_ms": 4.146489001810551, "compute_loss_in_ms": 268.08270847052336, "epoch": 32.24, "learning_rate/full": 0.00026835083436875734, "loss": 3.6692, "step": 78000, "training_step_in_ms": 966.2784307040274 }, { "_prepare_inputs_in_ms": 4.1479257568717, "compute_loss_in_ms": 267.2712250612676, "epoch": 32.66, "learning_rate/full": 0.0002653930599834242, "loss": 3.6736, "step": 79000, "training_step_in_ms": 968.4041320718825 }, { "_prepare_inputs_in_ms": 4.126915082335472, "compute_loss_in_ms": 268.5138017758727, "epoch": 33.07, "learning_rate/full": 0.0002624132077738845, "loss": 3.6731, "step": 80000, "training_step_in_ms": 969.1153637133539 }, { "epoch": 33.07, "eval_visual_genome-densecap-local-densecap-test_loss": 3.5850701332092285, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2637883107097123, "eval_visual_genome-densecap-local-densecap-test_runtime": 77.0939, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.377, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.324, "step": 80000 }, { "_prepare_inputs_in_ms": 4.120095092348937, "compute_loss_in_ms": 267.7357228696346, "epoch": 33.48, "learning_rate/full": 0.0002594179251945605, "loss": 3.6671, "step": 81000, "training_step_in_ms": 963.6873134560883 }, { "_prepare_inputs_in_ms": 4.124605063349009, "compute_loss_in_ms": 267.57319816574454, "epoch": 33.9, "learning_rate/full": 0.00025641096982950234, "loss": 3.6662, "step": 82000, "training_step_in_ms": 965.3064449094236 }, { "_prepare_inputs_in_ms": 4.129976071417332, "compute_loss_in_ms": 267.9822950810194, "epoch": 34.31, "learning_rate/full": 0.00025339009590173424, "loss": 3.6651, "step": 83000, "training_step_in_ms": 967.112907551229 }, { "_prepare_inputs_in_ms": 4.144246697425842, "compute_loss_in_ms": 268.09172417223454, "epoch": 34.73, "learning_rate/full": 0.0002503530053325778, "loss": 3.6622, "step": 84000, "training_step_in_ms": 963.3224161304533 }, { "_prepare_inputs_in_ms": 4.138608705252409, "compute_loss_in_ms": 267.34737430512905, "epoch": 35.14, "learning_rate/full": 0.0002473065215350535, "loss": 3.66, "step": 85000, "training_step_in_ms": 964.2706917002797 }, { "epoch": 35.14, "eval_visual_genome-densecap-local-densecap-test_loss": 3.5811269283294678, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2639846881301574, "eval_visual_genome-densecap-local-densecap-test_runtime": 78.4776, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.194, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.319, "step": 85000 }, { "_prepare_inputs_in_ms": 4.154233903419681, "compute_loss_in_ms": 267.71352230757475, "epoch": 35.55, "learning_rate/full": 0.00024424836556120313, "loss": 3.6547, "step": 86000, "training_step_in_ms": 962.3722572363913 }, { "_prepare_inputs_in_ms": 4.109987150877714, "compute_loss_in_ms": 267.4717643670738, "epoch": 35.97, "learning_rate/full": 0.000241179291965253, "loss": 3.662, "step": 87000, "training_step_in_ms": 962.7631023935974 }, { "_prepare_inputs_in_ms": 4.130292858928442, "compute_loss_in_ms": 268.7110885903239, "epoch": 36.38, "learning_rate/full": 0.0002381000579951894, "loss": 3.6533, "step": 88000, "training_step_in_ms": 966.5117364116013 }, { "_prepare_inputs_in_ms": 4.127315446734428, "compute_loss_in_ms": 267.80369279161096, "epoch": 36.79, "learning_rate/full": 0.00023501142340591894, "loss": 3.6541, "step": 89000, "training_step_in_ms": 966.1625612042844 }, { "_prepare_inputs_in_ms": 4.147790517657995, "compute_loss_in_ms": 268.44236666709185, "epoch": 37.21, "learning_rate/full": 0.00023191415027181022, "loss": 3.6505, "step": 90000, "training_step_in_ms": 969.9625728055835 }, { "epoch": 37.21, "eval_visual_genome-densecap-local-densecap-test_loss": 3.5739023685455322, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2666824586460844, "eval_visual_genome-densecap-local-densecap-test_runtime": 78.5693, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.182, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.318, "step": 90000 }, { "_prepare_inputs_in_ms": 4.1041579188370125, "compute_loss_in_ms": 267.84072072431445, "epoch": 37.62, "learning_rate/full": 0.00022880900279866363, "loss": 3.6517, "step": 91000, "training_step_in_ms": 962.2163318134844 }, { "_prepare_inputs_in_ms": 4.135395355522633, "compute_loss_in_ms": 267.92124405503273, "epoch": 38.03, "learning_rate/full": 0.0002256936284593779, "loss": 3.6526, "step": 92000, "training_step_in_ms": 965.9340194314718 }, { "_prepare_inputs_in_ms": 4.124495934695005, "compute_loss_in_ms": 267.63855477049947, "epoch": 38.45, "learning_rate/full": 0.00022257502654664658, "loss": 3.6411, "step": 93000, "training_step_in_ms": 968.471509065479 }, { "_prepare_inputs_in_ms": 4.13615457713604, "compute_loss_in_ms": 268.6791280247271, "epoch": 38.86, "learning_rate/full": 0.00021945398441148287, "loss": 3.6456, "step": 94000, "training_step_in_ms": 964.7193784303963 }, { "_prepare_inputs_in_ms": 4.138962186872959, "compute_loss_in_ms": 267.87416788190603, "epoch": 39.27, "learning_rate/full": 0.00021632188341385878, "loss": 3.6474, "step": 95000, "training_step_in_ms": 964.3936127200723 }, { "epoch": 39.27, "eval_visual_genome-densecap-local-densecap-test_loss": 3.570530414581299, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.26555671498307476, "eval_visual_genome-densecap-local-densecap-test_runtime": 77.8889, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.271, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.321, "step": 95000 }, { "_prepare_inputs_in_ms": 4.114193618297577, "compute_loss_in_ms": 267.61803087219596, "epoch": 39.69, "learning_rate/full": 0.0002131888850633025, "loss": 3.6443, "step": 96000, "training_step_in_ms": 962.9699364975095 }, { "_prepare_inputs_in_ms": 4.118229653686285, "compute_loss_in_ms": 267.60003339126706, "epoch": 40.1, "learning_rate/full": 0.00021005263255270636, "loss": 3.6436, "step": 97000, "training_step_in_ms": 967.0044349320233 }, { "_prepare_inputs_in_ms": 4.14753895252943, "compute_loss_in_ms": 267.94382878765464, "epoch": 40.51, "learning_rate/full": 0.00020691389970544863, "loss": 3.6409, "step": 98000, "training_step_in_ms": 965.2209133654833 }, { "_prepare_inputs_in_ms": 4.132391892373562, "compute_loss_in_ms": 268.32156636565924, "epoch": 40.93, "learning_rate/full": 0.00020377031677881017, "loss": 3.6386, "step": 99000, "training_step_in_ms": 965.1960897520185 }, { "_prepare_inputs_in_ms": 4.139371138066053, "compute_loss_in_ms": 268.1989936903119, "epoch": 41.34, "learning_rate/full": 0.00020062894644154732, "loss": 3.628, "step": 100000, "training_step_in_ms": 969.4596163183451 }, { "epoch": 41.34, "eval_visual_genome-densecap-local-densecap-test_loss": 3.565774440765381, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.26571601552352997, "eval_visual_genome-densecap-local-densecap-test_runtime": 77.6144, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.307, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.322, "step": 100000 }, { "_prepare_inputs_in_ms": 4.108485870245026, "compute_loss_in_ms": 267.23163178935647, "epoch": 41.75, "learning_rate/full": 0.00019748742092116103, "loss": 3.6364, "step": 101000, "training_step_in_ms": 962.6803079359233 }, { "_prepare_inputs_in_ms": 4.145125687122345, "compute_loss_in_ms": 267.68679490312934, "epoch": 42.17, "learning_rate/full": 0.00019434651534206603, "loss": 3.6315, "step": 102000, "training_step_in_ms": 964.9059623852372 }, { "_prepare_inputs_in_ms": 4.14092817902565, "compute_loss_in_ms": 268.40766886249185, "epoch": 42.58, "learning_rate/full": 0.00019120700467571537, "loss": 3.6249, "step": 103000, "training_step_in_ms": 968.5381288193166 }, { "_prepare_inputs_in_ms": 4.131742633879185, "compute_loss_in_ms": 267.6234121248126, "epoch": 42.99, "learning_rate/full": 0.00018806966354938863, "loss": 3.6302, "step": 104000, "training_step_in_ms": 965.0357882864773 }, { "_prepare_inputs_in_ms": 4.159636992961168, "compute_loss_in_ms": 268.2043272703886, "epoch": 43.41, "learning_rate/full": 0.0001849352660550636, "loss": 3.6221, "step": 105000, "training_step_in_ms": 966.8701088428497 }, { "epoch": 43.41, "eval_visual_genome-densecap-local-densecap-test_loss": 3.560976266860962, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2679473083105533, "eval_visual_genome-densecap-local-densecap-test_runtime": 78.6952, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.166, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.318, "step": 105000 }, { "_prepare_inputs_in_ms": 4.1656713769203275, "compute_loss_in_ms": 267.7097022458911, "epoch": 43.82, "learning_rate/full": 0.00018180458555842107, "loss": 3.6281, "step": 106000, "training_step_in_ms": 960.9392982535064 }, { "_prepare_inputs_in_ms": 4.1548894718289375, "compute_loss_in_ms": 268.3351138718426, "epoch": 44.23, "learning_rate/full": 0.00017867839450802815, "loss": 3.6257, "step": 107000, "training_step_in_ms": 967.5997758358717 }, { "_prepare_inputs_in_ms": 4.136493876576424, "compute_loss_in_ms": 267.79356829449534, "epoch": 44.65, "learning_rate/full": 0.0001755574642447484, "loss": 3.6275, "step": 108000, "training_step_in_ms": 964.6688169278204 }, { "_prepare_inputs_in_ms": 4.146924342960119, "compute_loss_in_ms": 268.7044747136533, "epoch": 45.06, "learning_rate/full": 0.00017244256481142465, "loss": 3.6272, "step": 109000, "training_step_in_ms": 966.0691562928259 }, { "_prepare_inputs_in_ms": 4.129870388656855, "compute_loss_in_ms": 267.92700193077326, "epoch": 45.47, "learning_rate/full": 0.00016933446476288295, "loss": 3.6231, "step": 110000, "training_step_in_ms": 968.8978024721146 }, { "epoch": 45.47, "eval_visual_genome-densecap-local-densecap-test_loss": 3.557985544204712, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.26707363597972006, "eval_visual_genome-densecap-local-densecap-test_runtime": 77.4146, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.334, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.323, "step": 110000 }, { "_prepare_inputs_in_ms": 4.14337538001014, "compute_loss_in_ms": 267.68642891570926, "epoch": 45.89, "learning_rate/full": 0.0001662308313853947, "loss": 3.6179, "step": 111000, "training_step_in_ms": 963.7148243077099 }, { "_prepare_inputs_in_ms": 4.14999657869339, "compute_loss_in_ms": 267.70868534594774, "epoch": 46.3, "learning_rate/full": 0.000163135546733723, "loss": 3.6124, "step": 112000, "training_step_in_ms": 967.6017691344023 }, { "_prepare_inputs_in_ms": 4.146619476377964, "compute_loss_in_ms": 268.191356562078, "epoch": 46.71, "learning_rate/full": 0.00016005245741683915, "loss": 3.62, "step": 113000, "training_step_in_ms": 966.300628580153 }, { "_prepare_inputs_in_ms": 4.153369773179293, "compute_loss_in_ms": 267.8536421582103, "epoch": 47.13, "learning_rate/full": 0.00015697922455833988, "loss": 3.6157, "step": 114000, "training_step_in_ms": 964.6176136285067 }, { "_prepare_inputs_in_ms": 4.187301464378834, "compute_loss_in_ms": 268.31423101201653, "epoch": 47.54, "learning_rate/full": 0.0001539166064324471, "loss": 3.6143, "step": 115000, "training_step_in_ms": 968.9795580692589 }, { "epoch": 47.54, "eval_visual_genome-densecap-local-densecap-test_loss": 3.556086778640747, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2680325079129448, "eval_visual_genome-densecap-local-densecap-test_runtime": 78.6426, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.173, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.318, "step": 115000 }, { "_prepare_inputs_in_ms": 4.146232630421475, "compute_loss_in_ms": 267.5073589235544, "epoch": 47.95, "learning_rate/full": 0.00015086535869435647, "loss": 3.6143, "step": 116000, "training_step_in_ms": 961.0740608982742 }, { "_prepare_inputs_in_ms": 4.149144068360329, "compute_loss_in_ms": 268.67081797868013, "epoch": 48.37, "learning_rate/full": 0.00014782623419379065, "loss": 3.6076, "step": 117000, "training_step_in_ms": 968.1870553046465 }, { "_prepare_inputs_in_ms": 4.165053818374872, "compute_loss_in_ms": 267.5217378772795, "epoch": 48.78, "learning_rate/full": 0.00014479998278924466, "loss": 3.6033, "step": 118000, "training_step_in_ms": 964.0207477062941 }, { "_prepare_inputs_in_ms": 4.148088995367289, "compute_loss_in_ms": 267.9359416142106, "epoch": 49.19, "learning_rate/full": 0.00014178735116296984, "loss": 3.6099, "step": 119000, "training_step_in_ms": 965.35854877159 }, { "_prepare_inputs_in_ms": 4.147441305220127, "compute_loss_in_ms": 268.18652522563934, "epoch": 49.61, "learning_rate/full": 0.00013878908263674099, "loss": 3.6041, "step": 120000, "training_step_in_ms": 966.7598981000483 }, { "epoch": 49.61, "eval_visual_genome-densecap-local-densecap-test_loss": 3.5552496910095215, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2690825925881079, "eval_visual_genome-densecap-local-densecap-test_runtime": 77.206, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.362, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.324, "step": 120000 }, { "_prepare_inputs_in_ms": 4.151007533073425, "compute_loss_in_ms": 267.91314566135406, "epoch": 50.02, "learning_rate/full": 0.00013580293864950247, "loss": 3.6068, "step": 121000, "training_step_in_ms": 965.1756884045899 }, { "_prepare_inputs_in_ms": 4.154482748359442, "compute_loss_in_ms": 268.1262241154909, "epoch": 50.43, "learning_rate/full": 0.00013283562815289706, "loss": 3.5972, "step": 122000, "training_step_in_ms": 965.2079959511757 }, { "_prepare_inputs_in_ms": 4.1559099070727825, "compute_loss_in_ms": 267.7796282917261, "epoch": 50.85, "learning_rate/full": 0.0001298848894600429, "loss": 3.6031, "step": 123000, "training_step_in_ms": 966.0297281630337 }, { "_prepare_inputs_in_ms": 4.1683206632733345, "compute_loss_in_ms": 268.80906841158867, "epoch": 51.26, "learning_rate/full": 0.00012694852315582903, "loss": 3.5985, "step": 124000, "training_step_in_ms": 967.5091603025794 }, { "_prepare_inputs_in_ms": 4.137588050216436, "compute_loss_in_ms": 267.6871258877218, "epoch": 51.67, "learning_rate/full": 0.00012403603541958643, "loss": 3.6029, "step": 125000, "training_step_in_ms": 964.4286920540035 }, { "epoch": 51.67, "eval_visual_genome-densecap-local-densecap-test_loss": 3.5499510765075684, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.268844144332836, "eval_visual_genome-densecap-local-densecap-test_runtime": 77.7216, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.293, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.322, "step": 125000 }, { "_prepare_inputs_in_ms": 4.127907207826289, "compute_loss_in_ms": 267.8013560883701, "epoch": 52.09, "learning_rate/full": 0.00012113936318920029, "loss": 3.5962, "step": 126000, "training_step_in_ms": 962.9286280833185 }, { "_prepare_inputs_in_ms": 4.151306886225939, "compute_loss_in_ms": 267.83537547290325, "epoch": 52.5, "learning_rate/full": 0.00011825927853225391, "loss": 3.5974, "step": 127000, "training_step_in_ms": 967.7427954226732 }, { "_prepare_inputs_in_ms": 4.118186391890049, "compute_loss_in_ms": 268.2419737614691, "epoch": 52.91, "learning_rate/full": 0.00011540225211753402, "loss": 3.5979, "step": 128000, "training_step_in_ms": 963.5640154518187 }, { "_prepare_inputs_in_ms": 4.146437399089336, "compute_loss_in_ms": 267.88536206260324, "epoch": 53.33, "learning_rate/full": 0.00011256609893124084, "loss": 3.5919, "step": 129000, "training_step_in_ms": 965.4581209644675 }, { "_prepare_inputs_in_ms": 4.140674088150263, "compute_loss_in_ms": 267.7817959152162, "epoch": 53.74, "learning_rate/full": 0.00010975151875173475, "loss": 3.5954, "step": 130000, "training_step_in_ms": 967.2819016650319 }, { "epoch": 53.74, "eval_visual_genome-densecap-local-densecap-test_loss": 3.5497984886169434, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.27146193885645503, "eval_visual_genome-densecap-local-densecap-test_runtime": 77.8468, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.277, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.321, "step": 130000 }, { "_prepare_inputs_in_ms": 4.144404723149974, "compute_loss_in_ms": 267.8810519017279, "epoch": 54.15, "learning_rate/full": 0.00010695920603455975, "loss": 3.5914, "step": 131000, "training_step_in_ms": 962.7643201723695 }, { "_prepare_inputs_in_ms": 4.15174587816, "compute_loss_in_ms": 268.55379743501544, "epoch": 54.57, "learning_rate/full": 0.00010418984974109642, "loss": 3.5916, "step": 132000, "training_step_in_ms": 965.8136657737195 }, { "_prepare_inputs_in_ms": 4.164624106138945, "compute_loss_in_ms": 268.1068575233221, "epoch": 54.98, "learning_rate/full": 0.00010144413316857143, "loss": 3.5824, "step": 133000, "training_step_in_ms": 961.5831676833332 }, { "_prepare_inputs_in_ms": 4.1917338743805885, "compute_loss_in_ms": 268.29790291562676, "epoch": 55.39, "learning_rate/full": 9.872273378146393e-05, "loss": 3.5822, "step": 134000, "training_step_in_ms": 967.4604325480759 }, { "_prepare_inputs_in_ms": 4.154745582491159, "compute_loss_in_ms": 268.35503727942705, "epoch": 55.81, "learning_rate/full": 9.602632304435166e-05, "loss": 3.5837, "step": 135000, "training_step_in_ms": 963.2355434708297 }, { "epoch": 55.81, "eval_visual_genome-densecap-local-densecap-test_loss": 3.5466184616088867, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2701472521164958, "eval_visual_genome-densecap-local-densecap-test_runtime": 77.7707, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.287, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.321, "step": 135000 }, { "_prepare_inputs_in_ms": 4.1385579000159005, "compute_loss_in_ms": 268.1807456240058, "epoch": 56.22, "learning_rate/full": 9.335556625623667e-05, "loss": 3.5886, "step": 136000, "training_step_in_ms": 964.7279985249043 }, { "_prepare_inputs_in_ms": 4.140180014073849, "compute_loss_in_ms": 268.0731739960611, "epoch": 56.63, "learning_rate/full": 9.071112238639306e-05, "loss": 3.5841, "step": 137000, "training_step_in_ms": 964.2245756573975 }, { "_prepare_inputs_in_ms": 4.159709714353085, "compute_loss_in_ms": 268.24955869838595, "epoch": 57.05, "learning_rate/full": 8.809103753928327e-05, "loss": 3.5843, "step": 138000, "training_step_in_ms": 966.5491472817957 }, { "_prepare_inputs_in_ms": 4.165288005024195, "compute_loss_in_ms": 268.81143694743514, "epoch": 57.46, "learning_rate/full": 8.550119824369325e-05, "loss": 3.5867, "step": 139000, "training_step_in_ms": 964.0126786530018 }, { "_prepare_inputs_in_ms": 4.144395582377911, "compute_loss_in_ms": 268.206242531538, "epoch": 57.88, "learning_rate/full": 8.29370600270935e-05, "loss": 3.5852, "step": 140000, "training_step_in_ms": 962.685001052916 }, { "epoch": 57.88, "eval_visual_genome-densecap-local-densecap-test_loss": 3.5455029010772705, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2711795494440531, "eval_visual_genome-densecap-local-densecap-test_runtime": 77.9766, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.259, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.321, "step": 140000 }, { "_prepare_inputs_in_ms": 4.152141958475113, "compute_loss_in_ms": 267.9933222196996, "epoch": 58.29, "learning_rate/full": 8.040438372331344e-05, "loss": 3.5737, "step": 141000, "training_step_in_ms": 965.1287141442299 }, { "_prepare_inputs_in_ms": 4.142403397709131, "compute_loss_in_ms": 267.5065658353269, "epoch": 58.7, "learning_rate/full": 7.790121584830201e-05, "loss": 3.575, "step": 142000, "training_step_in_ms": 962.7664158046246 }, { "_prepare_inputs_in_ms": 4.150233589112759, "compute_loss_in_ms": 268.65408623218536, "epoch": 59.12, "learning_rate/full": 7.542817402127658e-05, "loss": 3.5709, "step": 143000, "training_step_in_ms": 964.2099178209901 }, { "_prepare_inputs_in_ms": 4.130799826234579, "compute_loss_in_ms": 267.8640896603465, "epoch": 59.53, "learning_rate/full": 7.298586842830323e-05, "loss": 3.5775, "step": 144000, "training_step_in_ms": 964.5784216374159 }, { "_prepare_inputs_in_ms": 4.146471511572599, "compute_loss_in_ms": 268.14434216171503, "epoch": 59.94, "learning_rate/full": 7.057490167174197e-05, "loss": 3.5781, "step": 145000, "training_step_in_ms": 964.2295859828591 }, { "epoch": 59.94, "eval_visual_genome-densecap-local-densecap-test_loss": 3.5419652462005615, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2710637844956296, "eval_visual_genome-densecap-local-densecap-test_runtime": 78.2475, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.224, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.319, "step": 145000 }, { "_prepare_inputs_in_ms": 4.13495619122575, "compute_loss_in_ms": 267.6772438697517, "epoch": 60.36, "learning_rate/full": 6.819586862156388e-05, "loss": 3.5713, "step": 146000, "training_step_in_ms": 963.0674764961004 }, { "_prepare_inputs_in_ms": 4.138938769698143, "compute_loss_in_ms": 268.4652929417789, "epoch": 60.77, "learning_rate/full": 6.58493562685758e-05, "loss": 3.5755, "step": 147000, "training_step_in_ms": 965.1382315270603 }, { "_prepare_inputs_in_ms": 4.149636901915073, "compute_loss_in_ms": 268.6144716888666, "epoch": 61.18, "learning_rate/full": 6.35336446255852e-05, "loss": 3.5689, "step": 148000, "training_step_in_ms": 967.6213804855943 }, { "_prepare_inputs_in_ms": 4.154591448605061, "compute_loss_in_ms": 268.10440719127655, "epoch": 61.6, "learning_rate/full": 6.125393638794017e-05, "loss": 3.5736, "step": 149000, "training_step_in_ms": 966.7320594601333 }, { "_prepare_inputs_in_ms": 4.149040505290031, "compute_loss_in_ms": 268.75643199309707, "epoch": 62.01, "learning_rate/full": 5.900623127984053e-05, "loss": 3.57, "step": 150000, "training_step_in_ms": 965.394243825227 }, { "epoch": 62.01, "eval_visual_genome-densecap-local-densecap-test_loss": 3.542189359664917, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.27182213175584513, "eval_visual_genome-densecap-local-densecap-test_runtime": 78.2758, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.22, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.319, "step": 150000 }, { "_prepare_inputs_in_ms": 4.197841770038372, "compute_loss_in_ms": 268.5856811106205, "epoch": 62.42, "learning_rate/full": 5.6795579206763614e-05, "loss": 3.5655, "step": 151000, "training_step_in_ms": 963.427967004478 }, { "_prepare_inputs_in_ms": 4.1404072009027, "compute_loss_in_ms": 267.94744442403316, "epoch": 62.84, "learning_rate/full": 5.462026068170363e-05, "loss": 3.5665, "step": 152000, "training_step_in_ms": 965.5440159775317 }, { "_prepare_inputs_in_ms": 4.148986879736185, "compute_loss_in_ms": 268.1357101947069, "epoch": 63.25, "learning_rate/full": 5.247868899032384e-05, "loss": 3.5648, "step": 153000, "training_step_in_ms": 965.260343439877 }, { "_prepare_inputs_in_ms": 4.144355583935976, "compute_loss_in_ms": 268.8695700503886, "epoch": 63.66, "learning_rate/full": 5.0375675588795876e-05, "loss": 3.5699, "step": 154000, "training_step_in_ms": 968.1045257672668 }, { "_prepare_inputs_in_ms": 4.134350396692753, "compute_loss_in_ms": 267.78631913661957, "epoch": 64.08, "learning_rate/full": 4.830957975043959e-05, "loss": 3.5654, "step": 155000, "training_step_in_ms": 965.367557708174 }, { "epoch": 64.08, "eval_visual_genome-densecap-local-densecap-test_loss": 3.5409913063049316, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.273054083346476, "eval_visual_genome-densecap-local-densecap-test_runtime": 78.4578, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.197, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.319, "step": 155000 }, { "_prepare_inputs_in_ms": 4.169517766411712, "compute_loss_in_ms": 267.94907980412245, "epoch": 64.49, "learning_rate/full": 4.628091125348743e-05, "loss": 3.562, "step": 156000, "training_step_in_ms": 964.7187770940363 }, { "_prepare_inputs_in_ms": 4.127725187689066, "compute_loss_in_ms": 267.56007508188486, "epoch": 64.9, "learning_rate/full": 4.429017064153536e-05, "loss": 3.5599, "step": 157000, "training_step_in_ms": 961.402901135385 }, { "_prepare_inputs_in_ms": 4.122306831181049, "compute_loss_in_ms": 268.3586079515517, "epoch": 65.32, "learning_rate/full": 4.233784910004124e-05, "loss": 3.5666, "step": 158000, "training_step_in_ms": 965.8669985719025 }, { "_prepare_inputs_in_ms": 4.136414989829063, "compute_loss_in_ms": 267.9736096225679, "epoch": 65.73, "learning_rate/full": 4.0424428335132335e-05, "loss": 3.5573, "step": 159000, "training_step_in_ms": 965.0534134693444 }, { "_prepare_inputs_in_ms": 4.14548010751605, "compute_loss_in_ms": 268.10164315626025, "epoch": 66.14, "learning_rate/full": 3.855038045475119e-05, "loss": 3.5569, "step": 160000, "training_step_in_ms": 965.0257755257189 }, { "epoch": 66.14, "eval_visual_genome-densecap-local-densecap-test_loss": 3.540762424468994, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2735980306318844, "eval_visual_genome-densecap-local-densecap-test_runtime": 77.6347, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.305, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.322, "step": 160000 }, { "_prepare_inputs_in_ms": 4.134731147347427, "compute_loss_in_ms": 268.0676885545254, "epoch": 66.56, "learning_rate/full": 3.671616785217033e-05, "loss": 3.559, "step": 161000, "training_step_in_ms": 961.5968884006143 }, { "_prepare_inputs_in_ms": 4.13828482478857, "compute_loss_in_ms": 268.11520731821656, "epoch": 66.97, "learning_rate/full": 3.4920467704438286e-05, "loss": 3.5617, "step": 162000, "training_step_in_ms": 963.3356633149087 }, { "_prepare_inputs_in_ms": 4.1371137127280235, "compute_loss_in_ms": 267.97775723040104, "epoch": 67.38, "learning_rate/full": 3.3169048798042254e-05, "loss": 3.5629, "step": 163000, "training_step_in_ms": 964.7222346775234 }, { "_prepare_inputs_in_ms": 4.129249203950167, "compute_loss_in_ms": 267.63603001460433, "epoch": 67.8, "learning_rate/full": 3.145532456480391e-05, "loss": 3.5596, "step": 164000, "training_step_in_ms": 964.5063005648553 }, { "_prepare_inputs_in_ms": 4.151564922183752, "compute_loss_in_ms": 268.839259788394, "epoch": 68.21, "learning_rate/full": 2.9784920606062528e-05, "loss": 3.5602, "step": 165000, "training_step_in_ms": 972.3141440451145 }, { "epoch": 68.21, "eval_visual_genome-densecap-local-densecap-test_loss": 3.539008855819702, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2725576622048259, "eval_visual_genome-densecap-local-densecap-test_runtime": 78.4123, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.202, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.319, "step": 165000 }, { "_prepare_inputs_in_ms": 4.126259837208725, "compute_loss_in_ms": 267.8272004313767, "epoch": 68.62, "learning_rate/full": 2.8156514671178745e-05, "loss": 3.5603, "step": 166000, "training_step_in_ms": 964.2809295020998 }, { "_prepare_inputs_in_ms": 4.134287599474192, "compute_loss_in_ms": 267.94721764326096, "epoch": 69.04, "learning_rate/full": 2.65705085449506e-05, "loss": 3.5591, "step": 167000, "training_step_in_ms": 963.7021813839674 }, { "_prepare_inputs_in_ms": 4.147611241787672, "compute_loss_in_ms": 268.29229406639934, "epoch": 69.45, "learning_rate/full": 2.5025770357450595e-05, "loss": 3.5561, "step": 168000, "training_step_in_ms": 967.2244190610945 }, { "_prepare_inputs_in_ms": 4.15412675216794, "compute_loss_in_ms": 268.25271063297987, "epoch": 69.86, "learning_rate/full": 2.352577066262569e-05, "loss": 3.5576, "step": 169000, "training_step_in_ms": 965.3532739318907 }, { "_prepare_inputs_in_ms": 4.129838448017836, "compute_loss_in_ms": 267.92896181344986, "epoch": 70.28, "learning_rate/full": 2.206931334324922e-05, "loss": 3.5536, "step": 170000, "training_step_in_ms": 965.5082765445113 }, { "epoch": 70.28, "eval_visual_genome-densecap-local-densecap-test_loss": 3.5376806259155273, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2738309179784362, "eval_visual_genome-densecap-local-densecap-test_runtime": 77.9139, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.268, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.321, "step": 170000 }, { "_prepare_inputs_in_ms": 4.163786387298165, "compute_loss_in_ms": 267.95297726243734, "epoch": 70.69, "learning_rate/full": 2.0656757758371282e-05, "loss": 3.5571, "step": 171000, "training_step_in_ms": 960.7510039620101 }, { "_prepare_inputs_in_ms": 4.137572426348925, "compute_loss_in_ms": 267.8121683038771, "epoch": 71.1, "learning_rate/full": 1.9287105043128472e-05, "loss": 3.555, "step": 172000, "training_step_in_ms": 963.8648240976036 }, { "_prepare_inputs_in_ms": 4.139789171516895, "compute_loss_in_ms": 268.3458735384047, "epoch": 71.52, "learning_rate/full": 1.796343238799574e-05, "loss": 3.5518, "step": 173000, "training_step_in_ms": 965.790959071368 }, { "_prepare_inputs_in_ms": 4.144272416830063, "compute_loss_in_ms": 268.10323084518313, "epoch": 71.93, "learning_rate/full": 1.6684674532049582e-05, "loss": 3.5512, "step": 174000, "training_step_in_ms": 961.3717007525265 }, { "_prepare_inputs_in_ms": 4.1666854321956635, "compute_loss_in_ms": 268.03433157876134, "epoch": 72.34, "learning_rate/full": 1.5451146989656617e-05, "loss": 3.5495, "step": 175000, "training_step_in_ms": 967.3243609592319 }, { "epoch": 72.34, "eval_visual_genome-densecap-local-densecap-test_loss": 3.536776065826416, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2743759293675203, "eval_visual_genome-densecap-local-densecap-test_runtime": 78.6158, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.176, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.318, "step": 175000 }, { "_prepare_inputs_in_ms": 4.134207051701662, "compute_loss_in_ms": 267.52714550867677, "epoch": 72.76, "learning_rate/full": 1.4261987845053304e-05, "loss": 3.5555, "step": 176000, "training_step_in_ms": 962.5389591343701 }, { "_prepare_inputs_in_ms": 4.146069306880236, "compute_loss_in_ms": 268.7413688749075, "epoch": 73.17, "learning_rate/full": 1.3119868774900613e-05, "loss": 3.5512, "step": 177000, "training_step_in_ms": 964.9299626871943 }, { "_prepare_inputs_in_ms": 4.148835156112909, "compute_loss_in_ms": 268.0495460778475, "epoch": 73.58, "learning_rate/full": 1.2023859580780273e-05, "loss": 3.5529, "step": 178000, "training_step_in_ms": 967.7268707863986 }, { "_prepare_inputs_in_ms": 4.1666895635426044, "compute_loss_in_ms": 268.2634797357023, "epoch": 74.0, "learning_rate/full": 1.0973203331088377e-05, "loss": 3.5538, "step": 179000, "training_step_in_ms": 965.1008929647505 }, { "_prepare_inputs_in_ms": 4.153850518167019, "compute_loss_in_ms": 268.7998457066715, "epoch": 74.41, "learning_rate/full": 9.970260528869224e-06, "loss": 3.5524, "step": 180000, "training_step_in_ms": 968.3517145328224 }, { "epoch": 74.41, "eval_visual_genome-densecap-local-densecap-test_loss": 3.536918878555298, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2735705193198496, "eval_visual_genome-densecap-local-densecap-test_runtime": 78.7713, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.156, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.317, "step": 180000 }, { "_prepare_inputs_in_ms": 4.127806843054004, "compute_loss_in_ms": 268.1048993989825, "epoch": 74.82, "learning_rate/full": 9.01420472138852e-06, "loss": 3.5468, "step": 181000, "training_step_in_ms": 960.1139997318387 }, { "_prepare_inputs_in_ms": 4.13564395532012, "compute_loss_in_ms": 267.3685629181564, "epoch": 75.24, "learning_rate/full": 8.105271801111003e-06, "loss": 3.552, "step": 182000, "training_step_in_ms": 964.2471651136875 }, { "_prepare_inputs_in_ms": 4.140480011701584, "compute_loss_in_ms": 267.48710445687175, "epoch": 75.65, "learning_rate/full": 7.243686033634145e-06, "loss": 3.5473, "step": 183000, "training_step_in_ms": 966.0506127551198 }, { "_prepare_inputs_in_ms": 4.12862478941679, "compute_loss_in_ms": 268.38187746331096, "epoch": 76.06, "learning_rate/full": 6.429660002353832e-06, "loss": 3.5535, "step": 184000, "training_step_in_ms": 963.8830341026187 }, { "_prepare_inputs_in_ms": 4.138918172568083, "compute_loss_in_ms": 267.91103532910347, "epoch": 76.48, "learning_rate/full": 5.663394556012769e-06, "loss": 3.5489, "step": 185000, "training_step_in_ms": 969.0565127506852 }, { "epoch": 76.48, "eval_visual_genome-densecap-local-densecap-test_loss": 3.5358800888061523, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2731816800574383, "eval_visual_genome-densecap-local-densecap-test_runtime": 78.2007, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.23, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.32, "step": 185000 }, { "_prepare_inputs_in_ms": 4.125211863982968, "compute_loss_in_ms": 267.94072189182043, "epoch": 76.89, "learning_rate/full": 4.944383807374142e-06, "loss": 3.5495, "step": 186000, "training_step_in_ms": 963.789376296103 }, { "_prepare_inputs_in_ms": 4.155690658837557, "compute_loss_in_ms": 267.86934616044164, "epoch": 77.3, "learning_rate/full": 4.273596510048239e-06, "loss": 3.5465, "step": 187000, "training_step_in_ms": 966.8210936710238 }, { "_prepare_inputs_in_ms": 4.130576055496931, "compute_loss_in_ms": 268.2106507457793, "epoch": 77.72, "learning_rate/full": 3.6517966776118407e-06, "loss": 3.5445, "step": 188000, "training_step_in_ms": 966.5816915780306 }, { "_prepare_inputs_in_ms": 4.133735220879316, "compute_loss_in_ms": 267.8969533368945, "epoch": 78.13, "learning_rate/full": 3.0789924830065154e-06, "loss": 3.5528, "step": 189000, "training_step_in_ms": 964.6940425820649 }, { "_prepare_inputs_in_ms": 4.137146957218647, "compute_loss_in_ms": 267.9762873612344, "epoch": 78.54, "learning_rate/full": 2.5536764226682607e-06, "loss": 3.5458, "step": 190000, "training_step_in_ms": 966.734307706356 }, { "epoch": 78.54, "eval_visual_genome-densecap-local-densecap-test_loss": 3.5369150638580322, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.272921503437743, "eval_visual_genome-densecap-local-densecap-test_runtime": 79.0337, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.122, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.316, "step": 190000 }, { "_prepare_inputs_in_ms": 4.113826969774758, "compute_loss_in_ms": 267.3543768711388, "epoch": 78.96, "learning_rate/full": 2.077174866407172e-06, "loss": 3.5455, "step": 191000, "training_step_in_ms": 959.5898663066328 }, { "_prepare_inputs_in_ms": 4.15868678689003, "compute_loss_in_ms": 268.5514197871089, "epoch": 79.37, "learning_rate/full": 1.650411851111966e-06, "loss": 3.5422, "step": 192000, "training_step_in_ms": 966.848380189389 }, { "_prepare_inputs_in_ms": 4.152705859392881, "compute_loss_in_ms": 267.7775506339967, "epoch": 79.79, "learning_rate/full": 1.2717824473816864e-06, "loss": 3.5542, "step": 193000, "training_step_in_ms": 966.0438013672829 }, { "_prepare_inputs_in_ms": 4.149454560130835, "compute_loss_in_ms": 268.18433906137943, "epoch": 80.2, "learning_rate/full": 9.425893981038769e-07, "loss": 3.5513, "step": 194000, "training_step_in_ms": 968.7132156044245 }, { "_prepare_inputs_in_ms": 4.145272459834814, "compute_loss_in_ms": 269.00753265991807, "epoch": 80.61, "learning_rate/full": 6.625107863321489e-07, "loss": 3.5423, "step": 195000, "training_step_in_ms": 966.2778741791844 }, { "epoch": 80.61, "eval_visual_genome-densecap-local-densecap-test_loss": 3.5363166332244873, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.2732828183368321, "eval_visual_genome-densecap-local-densecap-test_runtime": 78.105, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.243, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.32, "step": 195000 }, { "_prepare_inputs_in_ms": 4.114095866680145, "compute_loss_in_ms": 267.9977478161454, "epoch": 81.03, "learning_rate/full": 4.3161571727299287e-07, "loss": 3.5457, "step": 196000, "training_step_in_ms": 963.1876187734306 }, { "_prepare_inputs_in_ms": 4.132705166935921, "compute_loss_in_ms": 268.0948423668742, "epoch": 81.44, "learning_rate/full": 2.4980400999989885e-07, "loss": 3.5462, "step": 197000, "training_step_in_ms": 967.0936130546033 }, { "_prepare_inputs_in_ms": 4.152493238449097, "compute_loss_in_ms": 268.8196250721812, "epoch": 81.85, "learning_rate/full": 1.174841397763915e-07, "loss": 3.5462, "step": 198000, "training_step_in_ms": 964.0161675550044 }, { "_prepare_inputs_in_ms": 4.15958097204566, "compute_loss_in_ms": 268.9542033970356, "epoch": 82.27, "learning_rate/full": 3.4482289435100457e-08, "loss": 3.5489, "step": 199000, "training_step_in_ms": 964.1794747672975 }, { "_prepare_inputs_in_ms": 4.161274570971727, "compute_loss_in_ms": 268.2289356328547, "epoch": 82.68, "learning_rate/full": 8.099638465708381e-10, "loss": 3.5503, "step": 200000, "training_step_in_ms": 966.4167955368757 }, { "epoch": 82.68, "eval_visual_genome-densecap-local-densecap-test_loss": 3.5363588333129883, "eval_visual_genome-densecap-local-densecap-test_meteor": 0.27337310510486335, "eval_visual_genome-densecap-local-densecap-test_runtime": 78.3968, "eval_visual_genome-densecap-local-densecap-test_samples_per_second": 10.204, "eval_visual_genome-densecap-local-densecap-test_steps_per_second": 0.319, "step": 200000 } ], "max_steps": 200000, "num_train_epochs": 83, "total_flos": 1.6535680980503157e+23, "trial_name": null, "trial_params": null }