{ "name": "root", "gauges": { "SoccerTwos.Policy.Entropy.mean": { "value": 2.0213615894317627, "min": 2.009491443634033, "max": 3.2956788539886475, "count": 500 }, "SoccerTwos.Policy.Entropy.sum": { "value": 38939.51171875, "min": 19765.470703125, "max": 154643.203125, "count": 500 }, "SoccerTwos.Environment.EpisodeLength.mean": { "value": 75.31818181818181, "min": 51.45744680851064, "max": 999.0, "count": 500 }, "SoccerTwos.Environment.EpisodeLength.sum": { "value": 19884.0, "min": 7992.0, "max": 29044.0, "count": 500 }, "SoccerTwos.Self-play.ELO.mean": { "value": 1530.8731346255302, "min": 1159.7741687804314, "max": 1546.65543014195, "count": 459 }, "SoccerTwos.Self-play.ELO.sum": { "value": 202075.25377056998, "min": 2321.067814248583, "max": 281538.77394771576, "count": 459 }, "SoccerTwos.Step.mean": { "value": 4999933.0, "min": 9540.0, "max": 4999933.0, "count": 500 }, "SoccerTwos.Step.sum": { "value": 4999933.0, "min": 9540.0, "max": 4999933.0, "count": 500 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { "value": -0.006711859721690416, "min": -0.07943391799926758, "max": 0.18840113282203674, "count": 500 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { "value": -0.8859654664993286, "min": -11.772872924804688, "max": 26.376157760620117, "count": 500 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { "value": -0.0078003061935305595, "min": -0.07678192853927612, "max": 0.18508915603160858, "count": 500 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { "value": -1.0296404361724854, "min": -11.542649269104004, "max": 25.9124813079834, "count": 500 }, "SoccerTwos.Environment.CumulativeReward.mean": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 500 }, "SoccerTwos.Environment.CumulativeReward.sum": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 500 }, "SoccerTwos.Policy.ExtrinsicReward.mean": { "value": 0.09212424177112001, "min": -0.5714285714285714, "max": 0.5371563597158953, "count": 500 }, "SoccerTwos.Policy.ExtrinsicReward.sum": { "value": 12.160399913787842, "min": -37.384000301361084, "max": 47.07479953765869, "count": 500 }, "SoccerTwos.Environment.GroupCumulativeReward.mean": { "value": 0.09212424177112001, "min": -0.5714285714285714, "max": 0.5371563597158953, "count": 500 }, "SoccerTwos.Environment.GroupCumulativeReward.sum": { "value": 12.160399913787842, "min": -37.384000301361084, "max": 47.07479953765869, "count": 500 }, "SoccerTwos.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 500 }, "SoccerTwos.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 500 }, "SoccerTwos.Losses.PolicyLoss.mean": { "value": 0.0227650248639596, "min": 0.009874877380449712, "max": 0.025181998672072343, "count": 238 }, "SoccerTwos.Losses.PolicyLoss.sum": { "value": 0.0227650248639596, "min": 0.009874877380449712, "max": 0.025181998672072343, "count": 238 }, "SoccerTwos.Losses.ValueLoss.mean": { "value": 0.08372622231642406, "min": 2.12503995650574e-06, "max": 0.09860104198257129, "count": 238 }, "SoccerTwos.Losses.ValueLoss.sum": { "value": 0.08372622231642406, "min": 2.12503995650574e-06, "max": 0.09860104198257129, "count": 238 }, "SoccerTwos.Losses.BaselineLoss.mean": { "value": 0.08488952120145161, "min": 2.1953862111937874e-06, "max": 0.1005101685722669, "count": 238 }, "SoccerTwos.Losses.BaselineLoss.sum": { "value": 0.08488952120145161, "min": 2.1953862111937874e-06, "max": 0.1005101685722669, "count": 238 }, "SoccerTwos.Policy.LearningRate.mean": { "value": 0.0003, "min": 0.0003, "max": 0.0003, "count": 238 }, "SoccerTwos.Policy.LearningRate.sum": { "value": 0.0003, "min": 0.0003, "max": 0.0003, "count": 238 }, "SoccerTwos.Policy.Epsilon.mean": { "value": 0.20000000000000007, "min": 0.20000000000000004, "max": 0.20000000000000007, "count": 238 }, "SoccerTwos.Policy.Epsilon.sum": { "value": 0.20000000000000007, "min": 0.20000000000000004, "max": 0.20000000000000007, "count": 238 }, "SoccerTwos.Policy.Beta.mean": { "value": 0.005000000000000001, "min": 0.005000000000000001, "max": 0.005000000000000001, "count": 238 }, "SoccerTwos.Policy.Beta.sum": { "value": 0.005000000000000001, "min": 0.005000000000000001, "max": 0.005000000000000001, "count": 238 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1675700579", "python_version": "3.9.16 | packaged by conda-forge | (main, Feb 1 2023, 21:28:38) [MSC v.1929 64 bit (AMD64)]", "command_line_arguments": "E:\\ProgramData\\Miniconda3\\envs\\rl_hf\\Scripts\\mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos --no-graphics", "mlagents_version": "0.31.0.dev0", "mlagents_envs_version": "0.31.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.13.1+cpu", "numpy_version": "1.21.2", "end_time_seconds": "1675721577" }, "total": 20997.972567, "count": 1, "self": 0.7350547999994888, "children": { "run_training.setup": { "total": 0.08352039999999983, "count": 1, "self": 0.08352039999999983 }, "TrainerController.start_learning": { "total": 20997.1539918, "count": 1, "self": 10.351660299456853, "children": { "TrainerController._reset_env": { "total": 4.556975699996396, "count": 25, "self": 4.556975699996396 }, "TrainerController.advance": { "total": 20982.06151190055, "count": 333375, "self": 10.567984800814884, "children": { "env_step": { "total": 6646.6473090000845, "count": 333375, "self": 5007.922153899531, "children": { "SubprocessEnvManager._take_step": { "total": 1632.6026722003107, "count": 333375, "self": 63.33631170102626, "children": { "TorchPolicy.evaluate": { "total": 1569.2663604992845, "count": 636786, "self": 1569.2663604992845 } } }, "workers": { "total": 6.122482900242986, "count": 333375, "self": 0.0, "children": { "worker_root": { "total": 20979.775855499633, "count": 333375, "is_parallel": true, "self": 17063.27428249941, "children": { "steps_from_proto": { "total": 0.05782670000149581, "count": 50, "is_parallel": true, "self": 0.012298500004381374, "children": { "_process_rank_one_or_two_observation": { "total": 0.04552819999711444, "count": 200, "is_parallel": true, "self": 0.04552819999711444 } } }, "UnityEnvironment.step": { "total": 3916.443746300221, "count": 333375, "is_parallel": true, "self": 210.33805879946203, "children": { "UnityEnvironment._generate_step_input": { "total": 174.12952240006086, "count": 333375, "is_parallel": true, "self": 174.12952240006086 }, "communicator.exchange": { "total": 2840.075861300319, "count": 333375, "is_parallel": true, "self": 2840.075861300319 }, "steps_from_proto": { "total": 691.9003038003789, "count": 666750, "is_parallel": true, "self": 147.23733259858454, "children": { "_process_rank_one_or_two_observation": { "total": 544.6629712017943, "count": 2667000, "is_parallel": true, "self": 544.6629712017943 } } } } } } } } } } }, "trainer_advance": { "total": 14324.846218099648, "count": 333375, "self": 68.94114420022379, "children": { "process_trajectory": { "total": 1739.43297689941, "count": 333375, "self": 1736.6504571994114, "children": { "RLTrainer._checkpoint": { "total": 2.782519699998602, "count": 10, "self": 2.782519699998602 } } }, "_update_policy": { "total": 12516.472097000014, "count": 238, "self": 1058.2553322000622, "children": { "TorchPOCAOptimizer.update": { "total": 11458.216764799952, "count": 7149, "self": 11458.216764799952 } } } } } } }, "trainer_threads": { "total": 1.0000003385357559e-06, "count": 1, "self": 1.0000003385357559e-06 }, "TrainerController._save_models": { "total": 0.18384289999812609, "count": 1, "self": 0.00261540000064997, "children": { "RLTrainer._checkpoint": { "total": 0.18122749999747612, "count": 1, "self": 0.18122749999747612 } } } } } } }