First Push

d156634 12 months ago

18.7 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.43953874707221985,
	"min": 0.42135411500930786,
	"max": 1.434498906135559,
	"count": 33
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 13312.75,
	"min": 12499.048828125,
	"max": 43516.95703125,
	"count": 33
	},
	"Pyramids.Step.mean": {
	"value": 989876.0,
	"min": 29908.0,
	"max": 989876.0,
	"count": 33
	},
	"Pyramids.Step.sum": {
	"value": 989876.0,
	"min": 29908.0,
	"max": 989876.0,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.3469477593898773,
	"min": -0.09750516712665558,
	"max": 0.3469477593898773,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 90.90031433105469,
	"min": -23.49874496459961,
	"max": 90.90031433105469,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.04918583109974861,
	"min": -0.00609207758679986,
	"max": 0.3285600244998932,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 12.886688232421875,
	"min": -1.4925589561462402,
	"max": 77.86872863769531,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06638421378508545,
	"min": 0.0657467637098582,
	"max": 0.07561135002938868,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9957632067762817,
	"min": 0.5870415161973802,
	"max": 1.0853670877986588,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.012467502224813765,
	"min": 0.0005424294119835732,
	"max": 0.012474717255047705,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.18701253337220647,
	"min": 0.007594011767770025,
	"max": 0.18701253337220647,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 7.577057474346671e-06,
	"min": 7.577057474346671e-06,
	"max": 0.00029484495171835,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.00011365586211520007,
	"min": 0.00011365586211520007,
	"max": 0.0036331843889386003,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10252565333333337,
	"min": 0.10252565333333337,
	"max": 0.19828165,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.5378848000000005,
	"min": 1.4783222000000003,
	"max": 2.6110613999999996,
	"count": 33
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.00026231276800000013,
	"min": 0.00026231276800000013,
	"max": 0.009828336835,
	"count": 33
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.003934691520000002,
	"min": 0.003934691520000002,
	"max": 0.12112503386000001,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.012602363713085651,
	"min": 0.012602363713085651,
	"max": 0.44268977642059326,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.18903546035289764,
	"min": 0.1861698180437088,
	"max": 3.541518211364746,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 462.77777777777777,
	"min": 462.77777777777777,
	"max": 990.8484848484849,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 29155.0,
	"min": 16451.0,
	"max": 32940.0,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.3149333078236807,
	"min": -0.9311636887264975,
	"max": 1.3149333078236807,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 82.84079839289188,
	"min": -30.728401727974415,
	"max": 82.84079839289188,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.3149333078236807,
	"min": -0.9311636887264975,
	"max": 1.3149333078236807,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 82.84079839289188,
	"min": -30.728401727974415,
	"max": 82.84079839289188,
	"count": 33
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.060952933739856004,
	"min": 0.060952933739856004,
	"max": 8.373383240664706,
	"count": 33
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 3.8400348256109282,
	"min": 3.8400348256109282,
	"max": 142.3475150913,
	"count": 33
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1702903524",
	"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "1.1.0.dev0",
	"mlagents_envs_version": "1.1.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.1.2+cu121",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1702905599"
	},
	"total": 2075.0884569010004,
	"count": 1,
	"self": 0.8340091170007327,
	"children": {
	"run_training.setup": {
	"total": 0.07078064799998174,
	"count": 1,
	"self": 0.07078064799998174
	},
	"TrainerController.start_learning": {
	"total": 2074.1836671359997,
	"count": 1,
	"self": 1.3587929349923797,
	"children": {
	"TrainerController._reset_env": {
	"total": 2.1862086329999784,
	"count": 1,
	"self": 2.1862086329999784
	},
	"TrainerController.advance": {
	"total": 2070.5545712880066,
	"count": 63433,
	"self": 1.4231073369774094,
	"children": {
	"env_step": {
	"total": 1454.6072410219901,
	"count": 63433,
	"self": 1323.446675419085,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 130.33998160494707,
	"count": 63433,
	"self": 4.733357381888027,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 125.60662422305904,
	"count": 62563,
	"self": 125.60662422305904
	}
	}
	},
	"workers": {
	"total": 0.8205839979580105,
	"count": 63433,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2069.217339483954,
	"count": 63433,
	"is_parallel": true,
	"self": 864.1328929329115,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0017604189999929076,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005545830001665308,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0012058359998263768,
	"count": 8,
	"is_parallel": true,
	"self": 0.0012058359998263768
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.04853810299982797,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005642249998345505,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.00046031800002310774,
	"count": 1,
	"is_parallel": true,
	"self": 0.00046031800002310774
	},
	"communicator.exchange": {
	"total": 0.045917056000007506,
	"count": 1,
	"is_parallel": true,
	"self": 0.045917056000007506
	},
	"steps_from_proto": {
	"total": 0.0015965039999628061,
	"count": 1,
	"is_parallel": true,
	"self": 0.00034127900062230765,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0012552249993404985,
	"count": 8,
	"is_parallel": true,
	"self": 0.0012552249993404985
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1205.0844465510427,
	"count": 63432,
	"is_parallel": true,
	"self": 34.566660914052136,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 24.442632394963084,
	"count": 63432,
	"is_parallel": true,
	"self": 24.442632394963084
	},
	"communicator.exchange": {
	"total": 1047.2239439030443,
	"count": 63432,
	"is_parallel": true,
	"self": 1047.2239439030443
	},
	"steps_from_proto": {
	"total": 98.85120933898315,
	"count": 63432,
	"is_parallel": true,
	"self": 19.95006917710134,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 78.90114016188181,
	"count": 507456,
	"is_parallel": true,
	"self": 78.90114016188181
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 614.5242229290388,
	"count": 63433,
	"self": 2.6567191330489095,
	"children": {
	"process_trajectory": {
	"total": 123.2409316149899,
	"count": 63433,
	"self": 123.0471291259903,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.1938024889996086,
	"count": 2,
	"self": 0.1938024889996086
	}
	}
	},
	"_update_policy": {
	"total": 488.62657218100003,
	"count": 454,
	"self": 291.85564948799697,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 196.77092269300306,
	"count": 22764,
	"self": 196.77092269300306
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 9.120003596763127e-07,
	"count": 1,
	"self": 9.120003596763127e-07
	},
	"TrainerController._save_models": {
	"total": 0.08409336800013989,
	"count": 1,
	"self": 0.001509172000169201,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.08258419599997069,
	"count": 1,
	"self": 0.08258419599997069
	}
	}
	}
	}
	}
	}
	}