|
{ |
|
"name": "root", |
|
"gauges": { |
|
"SoccerTwos.Policy.Entropy.mean": { |
|
"value": 2.1323177814483643, |
|
"min": 2.0925920009613037, |
|
"max": 3.2958126068115234, |
|
"count": 750 |
|
}, |
|
"SoccerTwos.Policy.Entropy.sum": { |
|
"value": 41759.3125, |
|
"min": 18373.73046875, |
|
"max": 135839.296875, |
|
"count": 750 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.mean": { |
|
"value": 54.022222222222226, |
|
"min": 46.308411214953274, |
|
"max": 999.0, |
|
"count": 750 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.sum": { |
|
"value": 19448.0, |
|
"min": 14020.0, |
|
"max": 28512.0, |
|
"count": 750 |
|
}, |
|
"SoccerTwos.Self-play.ELO.mean": { |
|
"value": 1442.7982170999321, |
|
"min": 1175.8767981610217, |
|
"max": 1442.7982170999321, |
|
"count": 396 |
|
}, |
|
"SoccerTwos.Self-play.ELO.sum": { |
|
"value": 259703.6790779878, |
|
"min": 2353.2776183580017, |
|
"max": 298886.27177008847, |
|
"count": 396 |
|
}, |
|
"SoccerTwos.Step.mean": { |
|
"value": 7499947.0, |
|
"min": 9272.0, |
|
"max": 7499947.0, |
|
"count": 750 |
|
}, |
|
"SoccerTwos.Step.sum": { |
|
"value": 7499947.0, |
|
"min": 9272.0, |
|
"max": 7499947.0, |
|
"count": 750 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
|
"value": 0.08528007566928864, |
|
"min": -0.08902060240507126, |
|
"max": 0.16198357939720154, |
|
"count": 750 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
|
"value": 15.435693740844727, |
|
"min": -12.81896686553955, |
|
"max": 28.185142517089844, |
|
"count": 750 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.09465673565864563, |
|
"min": -0.08676186203956604, |
|
"max": 0.17199347913265228, |
|
"count": 750 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 17.132869720458984, |
|
"min": -12.493707656860352, |
|
"max": 29.926864624023438, |
|
"count": 750 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.mean": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 750 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.sum": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 750 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.mean": { |
|
"value": 0.1420729272273364, |
|
"min": -0.4910444418589274, |
|
"max": 0.4178551661557165, |
|
"count": 750 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.sum": { |
|
"value": 25.715199828147888, |
|
"min": -37.96260005235672, |
|
"max": 58.661200165748596, |
|
"count": 750 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.mean": { |
|
"value": 0.1420729272273364, |
|
"min": -0.4910444418589274, |
|
"max": 0.4178551661557165, |
|
"count": 750 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.sum": { |
|
"value": 25.715199828147888, |
|
"min": -37.96260005235672, |
|
"max": 58.661200165748596, |
|
"count": 750 |
|
}, |
|
"SoccerTwos.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 750 |
|
}, |
|
"SoccerTwos.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 750 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.mean": { |
|
"value": 0.013896760379429907, |
|
"min": 0.011988342530094087, |
|
"max": 0.02492272947759678, |
|
"count": 350 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.sum": { |
|
"value": 0.013896760379429907, |
|
"min": 0.011988342530094087, |
|
"max": 0.02492272947759678, |
|
"count": 350 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.mean": { |
|
"value": 0.0895109735429287, |
|
"min": 3.223394425451905e-09, |
|
"max": 0.09912891238927841, |
|
"count": 350 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.sum": { |
|
"value": 0.0895109735429287, |
|
"min": 3.223394425451905e-09, |
|
"max": 0.09912891238927841, |
|
"count": 350 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.mean": { |
|
"value": 0.09168058733145396, |
|
"min": 3.2062370462308347e-09, |
|
"max": 0.10227111205458642, |
|
"count": 350 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.sum": { |
|
"value": 0.09168058733145396, |
|
"min": 3.2062370462308347e-09, |
|
"max": 0.10227111205458642, |
|
"count": 350 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.mean": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 350 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.sum": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 350 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.mean": { |
|
"value": 0.20000000000000007, |
|
"min": 0.20000000000000007, |
|
"max": 0.20000000000000007, |
|
"count": 350 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.sum": { |
|
"value": 0.20000000000000007, |
|
"min": 0.20000000000000007, |
|
"max": 0.20000000000000007, |
|
"count": 350 |
|
}, |
|
"SoccerTwos.Policy.Beta.mean": { |
|
"value": 0.005000000000000001, |
|
"min": 0.005000000000000001, |
|
"max": 0.005000000000000001, |
|
"count": 350 |
|
}, |
|
"SoccerTwos.Policy.Beta.sum": { |
|
"value": 0.005000000000000001, |
|
"min": 0.005000000000000001, |
|
"max": 0.005000000000000001, |
|
"count": 350 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1675478238", |
|
"python_version": "3.8.16 (default, Jan 17 2023, 23:13:24) \n[GCC 11.2.0]", |
|
"command_line_arguments": "/home/keshan/miniconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force", |
|
"mlagents_version": "0.31.0.dev0", |
|
"mlagents_envs_version": "0.31.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.8.1+cu102", |
|
"numpy_version": "1.21.2", |
|
"end_time_seconds": "1675487805" |
|
}, |
|
"total": 9567.807344482, |
|
"count": 1, |
|
"self": 0.5436419460002071, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.008059904999981882, |
|
"count": 1, |
|
"self": 0.008059904999981882 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 9567.255642631, |
|
"count": 1, |
|
"self": 9.405608434972237, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 4.7793283859953135, |
|
"count": 38, |
|
"self": 4.7793283859953135 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 9552.876563591033, |
|
"count": 494663, |
|
"self": 9.747094787091555, |
|
"children": { |
|
"env_step": { |
|
"total": 6833.046095705896, |
|
"count": 494663, |
|
"self": 4830.561937479352, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 1996.823041652454, |
|
"count": 494663, |
|
"self": 53.83810939587397, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 1942.9849322565801, |
|
"count": 963856, |
|
"self": 1942.9849322565801 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 5.661116574089419, |
|
"count": 494663, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 9551.001550163073, |
|
"count": 494663, |
|
"is_parallel": true, |
|
"self": 5748.170677710079, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.0019828280001092935, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.0007948390004912653, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0011879889996180282, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0011879889996180282 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.017460377000020344, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00040050200004770886, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0003641219999508394, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0003641219999508394 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.015327287999980399, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.015327287999980399 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0013684650000413967, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.0002882799999497365, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0010801850000916602, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0010801850000916602 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 3802.782827069997, |
|
"count": 494662, |
|
"is_parallel": true, |
|
"self": 235.98976235914142, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 168.4696023440173, |
|
"count": 494662, |
|
"is_parallel": true, |
|
"self": 168.4696023440173 |
|
}, |
|
"communicator.exchange": { |
|
"total": 2696.776058992281, |
|
"count": 494662, |
|
"is_parallel": true, |
|
"self": 2696.776058992281 |
|
}, |
|
"steps_from_proto": { |
|
"total": 701.5474033745572, |
|
"count": 989324, |
|
"is_parallel": true, |
|
"self": 150.17200161879146, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 551.3754017557658, |
|
"count": 3957296, |
|
"is_parallel": true, |
|
"self": 551.3754017557658 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.04804538299708838, |
|
"count": 74, |
|
"is_parallel": true, |
|
"self": 0.010409197989019958, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.037636185008068423, |
|
"count": 296, |
|
"is_parallel": true, |
|
"self": 0.037636185008068423 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 2710.0833730980457, |
|
"count": 494663, |
|
"self": 63.375225928014515, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 710.8399682470418, |
|
"count": 494663, |
|
"self": 706.4292853540411, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 4.41068289300074, |
|
"count": 15, |
|
"self": 4.41068289300074 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 1935.8681789229895, |
|
"count": 350, |
|
"self": 816.7539139299679, |
|
"children": { |
|
"TorchPOCAOptimizer.update": { |
|
"total": 1119.1142649930216, |
|
"count": 10500, |
|
"self": 1119.1142649930216 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 5.410001904238015e-07, |
|
"count": 1, |
|
"self": 5.410001904238015e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.1941416779991414, |
|
"count": 1, |
|
"self": 0.005221129998972174, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.18892054800016922, |
|
"count": 1, |
|
"self": 0.18892054800016922 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |