{ "name": "root", "gauges": { "SoccerTwos.Policy.Entropy.mean": { "value": 1.5969356298446655, "min": 1.5406135320663452, "max": 3.2957420349121094, "count": 1000 }, "SoccerTwos.Policy.Entropy.sum": { "value": 32807.4453125, "min": 22233.03515625, "max": 119406.3984375, "count": 1000 }, "SoccerTwos.Environment.EpisodeLength.mean": { "value": 52.81720430107527, "min": 40.56198347107438, "max": 999.0, "count": 1000 }, "SoccerTwos.Environment.EpisodeLength.sum": { "value": 19648.0, "min": 14076.0, "max": 23844.0, "count": 1000 }, "SoccerTwos.Self-play.ELO.mean": { "value": 1555.4992597326595, "min": 1190.120050817967, "max": 1604.2552553318303, "count": 992 }, "SoccerTwos.Self-play.ELO.sum": { "value": 289322.8623102747, "min": 2394.009544151198, "max": 379028.06362600107, "count": 992 }, "SoccerTwos.Step.mean": { "value": 9999972.0, "min": 9174.0, "max": 9999972.0, "count": 1000 }, "SoccerTwos.Step.sum": { "value": 9999972.0, "min": 9174.0, "max": 9999972.0, "count": 1000 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { "value": -0.014413188211619854, "min": -0.12347006052732468, "max": 0.12490702420473099, "count": 1000 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { "value": -2.6664397716522217, "min": -24.955711364746094, "max": 17.15989875793457, "count": 1000 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { "value": -0.010898062027990818, "min": -0.12485354393720627, "max": 0.12470623850822449, "count": 1000 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { "value": -2.016141414642334, "min": -24.727825164794922, "max": 16.87221908569336, "count": 1000 }, "SoccerTwos.Environment.CumulativeReward.mean": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 1000 }, "SoccerTwos.Environment.CumulativeReward.sum": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 1000 }, "SoccerTwos.Policy.ExtrinsicReward.mean": { "value": 0.13524540566109322, "min": -0.5605333337077388, "max": 0.41887500137090683, "count": 1000 }, "SoccerTwos.Policy.ExtrinsicReward.sum": { "value": 25.020400047302246, "min": -56.325600147247314, "max": 54.54360020160675, "count": 1000 }, "SoccerTwos.Environment.GroupCumulativeReward.mean": { "value": 0.13524540566109322, "min": -0.5605333337077388, "max": 0.41887500137090683, "count": 1000 }, "SoccerTwos.Environment.GroupCumulativeReward.sum": { "value": 25.020400047302246, "min": -56.325600147247314, "max": 54.54360020160675, "count": 1000 }, "SoccerTwos.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 1000 }, "SoccerTwos.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 1000 }, "SoccerTwos.Losses.PolicyLoss.mean": { "value": 0.02141846805801227, "min": 0.010343785071745515, "max": 0.02435030248016119, "count": 482 }, "SoccerTwos.Losses.PolicyLoss.sum": { "value": 0.02141846805801227, "min": 0.010343785071745515, "max": 0.02435030248016119, "count": 482 }, "SoccerTwos.Losses.ValueLoss.mean": { "value": 0.10125019202629724, "min": 0.00030965355545049534, "max": 0.12248869289954503, "count": 482 }, "SoccerTwos.Losses.ValueLoss.sum": { "value": 0.10125019202629724, "min": 0.00030965355545049534, "max": 0.12248869289954503, "count": 482 }, "SoccerTwos.Losses.BaselineLoss.mean": { "value": 0.10259012083212535, "min": 0.00030871983423518635, "max": 0.12475258807341258, "count": 482 }, "SoccerTwos.Losses.BaselineLoss.sum": { "value": 0.10259012083212535, "min": 0.00030871983423518635, "max": 0.12475258807341258, "count": 482 }, "SoccerTwos.Policy.LearningRate.mean": { "value": 0.0003, "min": 0.0003, "max": 0.0003, "count": 482 }, "SoccerTwos.Policy.LearningRate.sum": { "value": 0.0003, "min": 0.0003, "max": 0.0003, "count": 482 }, "SoccerTwos.Policy.Epsilon.mean": { "value": 0.20000000000000007, "min": 0.20000000000000007, "max": 0.20000000000000007, "count": 482 }, "SoccerTwos.Policy.Epsilon.sum": { "value": 0.20000000000000007, "min": 0.20000000000000007, "max": 0.20000000000000007, "count": 482 }, "SoccerTwos.Policy.Beta.mean": { "value": 0.005000000000000001, "min": 0.005000000000000001, "max": 0.005000000000000001, "count": 482 }, "SoccerTwos.Policy.Beta.sum": { "value": 0.005000000000000001, "min": 0.005000000000000001, "max": 0.005000000000000001, "count": 482 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1694708790", "python_version": "3.9.18 | packaged by conda-forge | (main, Aug 30 2023, 03:49:32) \n[GCC 12.3.0]", "command_line_arguments": "/home/terps/mambaforge/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force", "mlagents_version": "0.31.0.dev0", "mlagents_envs_version": "0.31.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.11.0+cu102", "numpy_version": "1.21.2", "end_time_seconds": "1694736508" }, "total": 27718.452107893998, "count": 1, "self": 1.7995216749986866, "children": { "run_training.setup": { "total": 0.012232699999003671, "count": 1, "self": 0.012232699999003671 }, "TrainerController.start_learning": { "total": 27716.640353519, "count": 1, "self": 19.2576742155361, "children": { "TrainerController._reset_env": { "total": 8.84835274298166, "count": 21, "self": 8.84835274298166 }, "TrainerController.advance": { "total": 27688.247795048483, "count": 680429, "self": 19.05893027050115, "children": { "env_step": { "total": 22157.30852160375, "count": 680429, "self": 15638.15256235451, "children": { "SubprocessEnvManager._take_step": { "total": 6507.746948996195, "count": 680429, "self": 113.61552996908722, "children": { "TorchPolicy.evaluate": { "total": 6394.131419027108, "count": 1254764, "self": 6394.131419027108 } } }, "workers": { "total": 11.40901025304629, "count": 680428, "self": 0.0, "children": { "worker_root": { "total": 27672.763382924164, "count": 680428, "is_parallel": true, "self": 14029.47554577728, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.007280599998921389, "count": 2, "is_parallel": true, "self": 0.005340200004866347, "children": { "_process_rank_one_or_two_observation": { "total": 0.001940399994055042, "count": 8, "is_parallel": true, "self": 0.001940399994055042 } } }, "UnityEnvironment.step": { "total": 0.03416270000161603, "count": 1, "is_parallel": true, "self": 0.0006320999964373186, "children": { "UnityEnvironment._generate_step_input": { "total": 0.0005296000017551705, "count": 1, "is_parallel": true, "self": 0.0005296000017551705 }, "communicator.exchange": { "total": 0.031072600002516992, "count": 1, "is_parallel": true, "self": 0.031072600002516992 }, "steps_from_proto": { "total": 0.0019284000009065494, "count": 2, "is_parallel": true, "self": 0.00048099999912665226, "children": { "_process_rank_one_or_two_observation": { "total": 0.0014474000017798971, "count": 8, "is_parallel": true, "self": 0.0014474000017798971 } } } } } } }, "UnityEnvironment.step": { "total": 13643.25105359788, "count": 680427, "is_parallel": true, "self": 402.79831428049874, "children": { "UnityEnvironment._generate_step_input": { "total": 276.44210654751805, "count": 680427, "is_parallel": true, "self": 276.44210654751805 }, "communicator.exchange": { "total": 11742.215522667906, "count": 680427, "is_parallel": true, "self": 11742.215522667906 }, "steps_from_proto": { "total": 1221.795110101957, "count": 1360854, "is_parallel": true, "self": 273.6090259386874, "children": { "_process_rank_one_or_two_observation": { "total": 948.1860841632697, "count": 5443416, "is_parallel": true, "self": 948.1860841632697 } } } } }, "steps_from_proto": { "total": 0.03678354900330305, "count": 40, "is_parallel": true, "self": 0.008402747000218369, "children": { "_process_rank_one_or_two_observation": { "total": 0.028380802003084682, "count": 160, "is_parallel": true, "self": 0.028380802003084682 } } } } } } } } }, "trainer_advance": { "total": 5511.880343174231, "count": 680428, "self": 128.80195408420332, "children": { "process_trajectory": { "total": 2575.0881813440137, "count": 680428, "self": 2568.601877004996, "children": { "RLTrainer._checkpoint": { "total": 6.486304339017806, "count": 20, "self": 6.486304339017806 } } }, "_update_policy": { "total": 2807.9902077460138, "count": 483, "self": 1697.4578579989175, "children": { "TorchPOCAOptimizer.update": { "total": 1110.5323497470963, "count": 14490, "self": 1110.5323497470963 } } } } } } }, "trainer_threads": { "total": 1.5999976312741637e-06, "count": 1, "self": 1.5999976312741637e-06 }, "TrainerController._save_models": { "total": 0.28652991200215183, "count": 1, "self": 0.002179615003115032, "children": { "RLTrainer._checkpoint": { "total": 0.2843502969990368, "count": 1, "self": 0.2843502969990368 } } } } } } }