ppo-Pyramids / run_logs /timers.json
maartenx01's picture
First Push
628a0a5 verified
raw
history blame
18.8 kB
{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.15419848263263702,
"min": 0.13651002943515778,
"max": 0.823553740978241,
"count": 80
},
"Pyramids.Policy.Entropy.sum": {
"value": 4633.35595703125,
"min": 3663.1669921875,
"max": 24707.591796875,
"count": 80
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 214.79136690647482,
"min": 138.16666666666666,
"max": 489.51666666666665,
"count": 80
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 29856.0,
"min": 829.0,
"max": 31776.0,
"count": 80
},
"Pyramids.Step.mean": {
"value": 2999909.0,
"min": 629931.0,
"max": 2999909.0,
"count": 80
},
"Pyramids.Step.sum": {
"value": 2999909.0,
"min": 629931.0,
"max": 2999909.0,
"count": 80
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.8359577655792236,
"min": 0.25308457016944885,
"max": 0.8370456695556641,
"count": 80
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 248.27944946289062,
"min": 8.604875564575195,
"max": 252.99343872070312,
"count": 80
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.005533040966838598,
"min": -0.01403752900660038,
"max": 0.024144239723682404,
"count": 80
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 1.6433131694793701,
"min": -4.028770923614502,
"max": 6.905252456665039,
"count": 80
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 1.7708172537654423,
"min": 1.410446641842524,
"max": 1.8618333041667938,
"count": 80
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 246.1435982733965,
"min": 11.170999825000763,
"max": 246.1435982733965,
"count": 80
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 1.7708172537654423,
"min": 1.410446641842524,
"max": 1.8618333041667938,
"count": 80
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 246.1435982733965,
"min": 11.170999825000763,
"max": 246.1435982733965,
"count": 80
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.016907050741648826,
"min": 0.014792351323800782,
"max": 0.044656114225896694,
"count": 80
},
"Pyramids.Policy.RndReward.sum": {
"value": 2.3500800530891865,
"min": 0.0887541079428047,
"max": 2.9113981585251167,
"count": 80
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.06731645511844814,
"min": 0.06449578986689057,
"max": 0.07284202956153811,
"count": 80
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.9424303716582739,
"min": 0.06511365686310455,
"max": 1.060511664133325,
"count": 80
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.015762173018168138,
"min": 0.007312449966169273,
"max": 0.016672092985356272,
"count": 80
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.22067042225435393,
"min": 0.007312449966169273,
"max": 0.24920289873261936,
"count": 80
},
"Pyramids.Policy.LearningRate.mean": {
"value": 1.4407423769285715e-06,
"min": 1.4407423769285715e-06,
"max": 0.00023719272093576668,
"count": 80
},
"Pyramids.Policy.LearningRate.sum": {
"value": 2.0170393277e-05,
"min": 2.0170393277e-05,
"max": 0.0035325708224765,
"count": 80
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10048021428571428,
"min": 0.10048021428571428,
"max": 0.17906423333333335,
"count": 80
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.406723,
"min": 0.17906423333333335,
"max": 2.6775235000000004,
"count": 80
},
"Pyramids.Policy.Beta.mean": {
"value": 5.797340714285716e-05,
"min": 5.797340714285716e-05,
"max": 0.007908516909999998,
"count": 80
},
"Pyramids.Policy.Beta.sum": {
"value": 0.0008116277000000002,
"min": 0.0008116277000000002,
"max": 0.11778459765000002,
"count": 80
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.0075660645961761475,
"min": 0.007331254426389933,
"max": 0.009189439006149769,
"count": 80
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.10592490434646606,
"min": 0.008900578133761883,
"max": 0.1329563856124878,
"count": 80
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 80
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 80
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1726695630",
"python_version": "3.10.12 (main, Sep 11 2024, 15:47:36) [GCC 11.4.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --resume --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "1.1.0.dev0",
"mlagents_envs_version": "1.1.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.4.0+cu121",
"numpy_version": "1.23.5",
"end_time_seconds": "1726704165"
},
"total": 8535.375619375,
"count": 1,
"self": 0.7452478820014221,
"children": {
"run_training.setup": {
"total": 0.08237167299967041,
"count": 1,
"self": 0.08237167299967041
},
"TrainerController.start_learning": {
"total": 8534.547999819999,
"count": 1,
"self": 6.145169671061012,
"children": {
"TrainerController._reset_env": {
"total": 3.3979853539999567,
"count": 1,
"self": 3.3979853539999567
},
"TrainerController.advance": {
"total": 8524.909182714937,
"count": 155171,
"self": 6.299874070782607,
"children": {
"env_step": {
"total": 5955.887078486949,
"count": 155171,
"self": 5576.892458963869,
"children": {
"SubprocessEnvManager._take_step": {
"total": 375.4418779521029,
"count": 155171,
"self": 18.163601917177402,
"children": {
"TorchPolicy.evaluate": {
"total": 357.2782760349255,
"count": 148435,
"self": 357.2782760349255
}
}
},
"workers": {
"total": 3.55274157097665,
"count": 155171,
"self": 0.0,
"children": {
"worker_root": {
"total": 8515.977976790391,
"count": 155171,
"is_parallel": true,
"self": 3398.8017618879967,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.003266829000040161,
"count": 1,
"is_parallel": true,
"self": 0.001071900000624737,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.002194928999415424,
"count": 8,
"is_parallel": true,
"self": 0.002194928999415424
}
}
},
"UnityEnvironment.step": {
"total": 0.06434809599977598,
"count": 1,
"is_parallel": true,
"self": 0.0008171239992407209,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0004978870001650648,
"count": 1,
"is_parallel": true,
"self": 0.0004978870001650648
},
"communicator.exchange": {
"total": 0.060996758000328555,
"count": 1,
"is_parallel": true,
"self": 0.060996758000328555
},
"steps_from_proto": {
"total": 0.002036327000041638,
"count": 1,
"is_parallel": true,
"self": 0.00041612399991208804,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0016202030001295498,
"count": 8,
"is_parallel": true,
"self": 0.0016202030001295498
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 5117.176214902394,
"count": 155170,
"is_parallel": true,
"self": 120.9194205134263,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 72.63085866806523,
"count": 155170,
"is_parallel": true,
"self": 72.63085866806523
},
"communicator.exchange": {
"total": 4615.281839628038,
"count": 155170,
"is_parallel": true,
"self": 4615.281839628038
},
"steps_from_proto": {
"total": 308.34409609286513,
"count": 155170,
"is_parallel": true,
"self": 68.52710665787299,
"children": {
"_process_rank_one_or_two_observation": {
"total": 239.81698943499214,
"count": 1241360,
"is_parallel": true,
"self": 239.81698943499214
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 2562.7222301572065,
"count": 155171,
"self": 12.20619110042071,
"children": {
"process_trajectory": {
"total": 410.9088252297897,
"count": 155171,
"self": 410.3971786137881,
"children": {
"RLTrainer._checkpoint": {
"total": 0.5116466160015989,
"count": 5,
"self": 0.5116466160015989
}
}
},
"_update_policy": {
"total": 2139.607213826996,
"count": 1124,
"self": 857.109888902974,
"children": {
"TorchPPOOptimizer.update": {
"total": 1282.497324924022,
"count": 54069,
"self": 1282.497324924022
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.2420005077729002e-06,
"count": 1,
"self": 1.2420005077729002e-06
},
"TrainerController._save_models": {
"total": 0.09566083800018532,
"count": 1,
"self": 0.0034099340009561274,
"children": {
"RLTrainer._checkpoint": {
"total": 0.0922509039992292,
"count": 1,
"self": 0.0922509039992292
}
}
}
}
}
}
}