ppo-Pyramids / run_logs /timers.json
wuwx's picture
First Push
d156634
{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.43953874707221985,
"min": 0.42135411500930786,
"max": 1.434498906135559,
"count": 33
},
"Pyramids.Policy.Entropy.sum": {
"value": 13312.75,
"min": 12499.048828125,
"max": 43516.95703125,
"count": 33
},
"Pyramids.Step.mean": {
"value": 989876.0,
"min": 29908.0,
"max": 989876.0,
"count": 33
},
"Pyramids.Step.sum": {
"value": 989876.0,
"min": 29908.0,
"max": 989876.0,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.3469477593898773,
"min": -0.09750516712665558,
"max": 0.3469477593898773,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 90.90031433105469,
"min": -23.49874496459961,
"max": 90.90031433105469,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.04918583109974861,
"min": -0.00609207758679986,
"max": 0.3285600244998932,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 12.886688232421875,
"min": -1.4925589561462402,
"max": 77.86872863769531,
"count": 33
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.06638421378508545,
"min": 0.0657467637098582,
"max": 0.07561135002938868,
"count": 33
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.9957632067762817,
"min": 0.5870415161973802,
"max": 1.0853670877986588,
"count": 33
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.012467502224813765,
"min": 0.0005424294119835732,
"max": 0.012474717255047705,
"count": 33
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.18701253337220647,
"min": 0.007594011767770025,
"max": 0.18701253337220647,
"count": 33
},
"Pyramids.Policy.LearningRate.mean": {
"value": 7.577057474346671e-06,
"min": 7.577057474346671e-06,
"max": 0.00029484495171835,
"count": 33
},
"Pyramids.Policy.LearningRate.sum": {
"value": 0.00011365586211520007,
"min": 0.00011365586211520007,
"max": 0.0036331843889386003,
"count": 33
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10252565333333337,
"min": 0.10252565333333337,
"max": 0.19828165,
"count": 33
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.5378848000000005,
"min": 1.4783222000000003,
"max": 2.6110613999999996,
"count": 33
},
"Pyramids.Policy.Beta.mean": {
"value": 0.00026231276800000013,
"min": 0.00026231276800000013,
"max": 0.009828336835,
"count": 33
},
"Pyramids.Policy.Beta.sum": {
"value": 0.003934691520000002,
"min": 0.003934691520000002,
"max": 0.12112503386000001,
"count": 33
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.012602363713085651,
"min": 0.012602363713085651,
"max": 0.44268977642059326,
"count": 33
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.18903546035289764,
"min": 0.1861698180437088,
"max": 3.541518211364746,
"count": 33
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 462.77777777777777,
"min": 462.77777777777777,
"max": 990.8484848484849,
"count": 33
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 29155.0,
"min": 16451.0,
"max": 32940.0,
"count": 33
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 1.3149333078236807,
"min": -0.9311636887264975,
"max": 1.3149333078236807,
"count": 33
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 82.84079839289188,
"min": -30.728401727974415,
"max": 82.84079839289188,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 1.3149333078236807,
"min": -0.9311636887264975,
"max": 1.3149333078236807,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 82.84079839289188,
"min": -30.728401727974415,
"max": 82.84079839289188,
"count": 33
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.060952933739856004,
"min": 0.060952933739856004,
"max": 8.373383240664706,
"count": 33
},
"Pyramids.Policy.RndReward.sum": {
"value": 3.8400348256109282,
"min": 3.8400348256109282,
"max": 142.3475150913,
"count": 33
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1702903524",
"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "1.1.0.dev0",
"mlagents_envs_version": "1.1.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.1.2+cu121",
"numpy_version": "1.23.5",
"end_time_seconds": "1702905599"
},
"total": 2075.0884569010004,
"count": 1,
"self": 0.8340091170007327,
"children": {
"run_training.setup": {
"total": 0.07078064799998174,
"count": 1,
"self": 0.07078064799998174
},
"TrainerController.start_learning": {
"total": 2074.1836671359997,
"count": 1,
"self": 1.3587929349923797,
"children": {
"TrainerController._reset_env": {
"total": 2.1862086329999784,
"count": 1,
"self": 2.1862086329999784
},
"TrainerController.advance": {
"total": 2070.5545712880066,
"count": 63433,
"self": 1.4231073369774094,
"children": {
"env_step": {
"total": 1454.6072410219901,
"count": 63433,
"self": 1323.446675419085,
"children": {
"SubprocessEnvManager._take_step": {
"total": 130.33998160494707,
"count": 63433,
"self": 4.733357381888027,
"children": {
"TorchPolicy.evaluate": {
"total": 125.60662422305904,
"count": 62563,
"self": 125.60662422305904
}
}
},
"workers": {
"total": 0.8205839979580105,
"count": 63433,
"self": 0.0,
"children": {
"worker_root": {
"total": 2069.217339483954,
"count": 63433,
"is_parallel": true,
"self": 864.1328929329115,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0017604189999929076,
"count": 1,
"is_parallel": true,
"self": 0.0005545830001665308,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0012058359998263768,
"count": 8,
"is_parallel": true,
"self": 0.0012058359998263768
}
}
},
"UnityEnvironment.step": {
"total": 0.04853810299982797,
"count": 1,
"is_parallel": true,
"self": 0.0005642249998345505,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.00046031800002310774,
"count": 1,
"is_parallel": true,
"self": 0.00046031800002310774
},
"communicator.exchange": {
"total": 0.045917056000007506,
"count": 1,
"is_parallel": true,
"self": 0.045917056000007506
},
"steps_from_proto": {
"total": 0.0015965039999628061,
"count": 1,
"is_parallel": true,
"self": 0.00034127900062230765,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0012552249993404985,
"count": 8,
"is_parallel": true,
"self": 0.0012552249993404985
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 1205.0844465510427,
"count": 63432,
"is_parallel": true,
"self": 34.566660914052136,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 24.442632394963084,
"count": 63432,
"is_parallel": true,
"self": 24.442632394963084
},
"communicator.exchange": {
"total": 1047.2239439030443,
"count": 63432,
"is_parallel": true,
"self": 1047.2239439030443
},
"steps_from_proto": {
"total": 98.85120933898315,
"count": 63432,
"is_parallel": true,
"self": 19.95006917710134,
"children": {
"_process_rank_one_or_two_observation": {
"total": 78.90114016188181,
"count": 507456,
"is_parallel": true,
"self": 78.90114016188181
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 614.5242229290388,
"count": 63433,
"self": 2.6567191330489095,
"children": {
"process_trajectory": {
"total": 123.2409316149899,
"count": 63433,
"self": 123.0471291259903,
"children": {
"RLTrainer._checkpoint": {
"total": 0.1938024889996086,
"count": 2,
"self": 0.1938024889996086
}
}
},
"_update_policy": {
"total": 488.62657218100003,
"count": 454,
"self": 291.85564948799697,
"children": {
"TorchPPOOptimizer.update": {
"total": 196.77092269300306,
"count": 22764,
"self": 196.77092269300306
}
}
}
}
}
}
},
"trainer_threads": {
"total": 9.120003596763127e-07,
"count": 1,
"self": 9.120003596763127e-07
},
"TrainerController._save_models": {
"total": 0.08409336800013989,
"count": 1,
"self": 0.001509172000169201,
"children": {
"RLTrainer._checkpoint": {
"total": 0.08258419599997069,
"count": 1,
"self": 0.08258419599997069
}
}
}
}
}
}
}