poca-SoccerTwos-v2 / run_logs /timers.json

First Push

5eb5fdb almost 2 years ago

20.2 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 1.556477665901184,
	"min": 1.4710997343063354,
	"max": 3.2958054542541504,
	"count": 1004
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 62707.37109375,
	"min": 57961.21484375,
	"max": 196482.734375,
	"count": 1004
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 63.53896103896104,
	"min": 41.633620689655174,
	"max": 991.0,
	"count": 1004
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 39140.0,
	"min": 36508.0,
	"max": 44136.0,
	"count": 1004
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1732.9269825569081,
	"min": 1200.3452679053712,
	"max": 1774.4282803625763,
	"count": 1004
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 533741.5106275277,
	"min": 2409.6247172591857,
	"max": 807856.6717437465,
	"count": 1004
	},
	"SoccerTwos.Step.mean": {
	"value": 20079978.0,
	"min": 19958.0,
	"max": 20079978.0,
	"count": 1004
	},
	"SoccerTwos.Step.sum": {
	"value": 20079978.0,
	"min": 19958.0,
	"max": 20079978.0,
	"count": 1004
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": 0.004693327471613884,
	"min": -0.11002453416585922,
	"max": 0.28316113352775574,
	"count": 1004
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": 1.4502382278442383,
	"min": -30.891870498657227,
	"max": 87.77995300292969,
	"count": 1004
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.0017897997749969363,
	"min": -0.10839186608791351,
	"max": 0.28043779730796814,
	"count": 1004
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": 0.5530481338500977,
	"min": -31.57282066345215,
	"max": 86.93571472167969,
	"count": 1004
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 1004
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 1004
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": 0.07618511224641769,
	"min": -0.3861116267913996,
	"max": 0.7115907681293977,
	"count": 1004
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": 23.541199684143066,
	"min": -86.69039988517761,
	"max": 151.60579979419708,
	"count": 1004
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": 0.07618511224641769,
	"min": -0.3861116267913996,
	"max": 0.7115907681293977,
	"count": 1004
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": 23.541199684143066,
	"min": -86.69039988517761,
	"max": 151.60579979419708,
	"count": 1004
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 1004
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 1004
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.01931103996466845,
	"min": 0.011364540978199026,
	"max": 0.02613362636960422,
	"count": 972
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.01931103996466845,
	"min": 0.011364540978199026,
	"max": 0.02613362636960422,
	"count": 972
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.10091944734255473,
	"min": 0.0017891564697492869,
	"max": 0.1364498645067215,
	"count": 972
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.10091944734255473,
	"min": 0.0017891564697492869,
	"max": 0.1364498645067215,
	"count": 972
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.10318002626299858,
	"min": 0.0017857251921668648,
	"max": 0.1403713325659434,
	"count": 972
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.10318002626299858,
	"min": 0.0017857251921668648,
	"max": 0.1403713325659434,
	"count": 972
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 972
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 972
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.19999999999999996,
	"max": 0.20000000000000007,
	"count": 972
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.19999999999999996,
	"max": 0.20000000000000007,
	"count": 972
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005,
	"max": 0.005000000000000001,
	"count": 972
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005,
	"max": 0.005000000000000001,
	"count": 972
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1675383867",
	"python_version": "3.8.16 (default, Jan 17 2023, 23:13:24) \n[GCC 11.2.0]",
	"command_line_arguments": "/home/lakoc/anaconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.8.1+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1675426774"
	},
	"total": 42906.562987696,
	"count": 1,
	"self": 0.059106691005581524,
	"children": {
	"run_training.setup": {
	"total": 0.0076704550001522875,
	"count": 1,
	"self": 0.0076704550001522875
	},
	"TrainerController.start_learning": {
	"total": 42906.496210549994,
	"count": 1,
	"self": 31.493490309010667,
	"children": {
	"TrainerController._reset_env": {
	"total": 3.7668858350125447,
	"count": 41,
	"self": 3.7668858350125447
	},
	"TrainerController.advance": {
	"total": 42870.95981721497,
	"count": 1379994,
	"self": 32.439994623477105,
	"children": {
	"env_step": {
	"total": 27018.915252399358,
	"count": 1379994,
	"self": 21046.866747180986,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 5952.585262612341,
	"count": 1379994,
	"self": 161.70714837239848,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 5790.878114239942,
	"count": 2515149,
	"self": 5790.878114239942
	}
	}
	},
	"workers": {
	"total": 19.4632426060316,
	"count": 1379993,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 42851.82584652449,
	"count": 1379993,
	"is_parallel": true,
	"self": 25313.08857872712,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0036851349996140925,
	"count": 2,
	"is_parallel": true,
	"self": 0.0008368140006496105,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.002848320998964482,
	"count": 8,
	"is_parallel": true,
	"self": 0.002848320998964482
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.02670044400019833,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005669430011039367,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0005311969998729182,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005311969998729182
	},
	"communicator.exchange": {
	"total": 0.023805957000149647,
	"count": 1,
	"is_parallel": true,
	"self": 0.023805957000149647
	},
	"steps_from_proto": {
	"total": 0.0017963469990718295,
	"count": 2,
	"is_parallel": true,
	"self": 0.0003687569997055107,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0014275899993663188,
	"count": 8,
	"is_parallel": true,
	"self": 0.0014275899993663188
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 17538.654487297365,
	"count": 1379992,
	"is_parallel": true,
	"self": 926.6944915361855,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 594.502346487754,
	"count": 1379992,
	"is_parallel": true,
	"self": 594.502346487754
	},
	"communicator.exchange": {
	"total": 13301.6280554498,
	"count": 1379992,
	"is_parallel": true,
	"self": 13301.6280554498
	},
	"steps_from_proto": {
	"total": 2715.8295938236242,
	"count": 2759984,
	"is_parallel": true,
	"self": 493.823149779153,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 2222.006444044471,
	"count": 11039936,
	"is_parallel": true,
	"self": 2222.006444044471
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.08278050000080839,
	"count": 80,
	"is_parallel": true,
	"self": 0.014847281085167197,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.06793321891564119,
	"count": 320,
	"is_parallel": true,
	"self": 0.06793321891564119
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 15819.604570192136,
	"count": 1379993,
	"self": 196.98733306854228,
	"children": {
	"process_trajectory": {
	"total": 4098.746716667649,
	"count": 1379993,
	"self": 4088.766313262644,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 9.980403405004836,
	"count": 40,
	"self": 9.980403405004836
	}
	}
	},
	"_update_policy": {
	"total": 11523.870520455945,
	"count": 973,
	"self": 2655.3542703912135,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 8868.516250064731,
	"count": 29202,
	"self": 8868.516250064731
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.4309989637695253e-06,
	"count": 1,
	"self": 1.4309989637695253e-06
	},
	"TrainerController._save_models": {
	"total": 0.27601575999869965,
	"count": 1,
	"self": 0.003253094997489825,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.2727626650012098,
	"count": 1,
	"self": 0.2727626650012098
	}
	}
	}
	}
	}
	}
	}