First Push

0cb907a about 1 year ago

20.3 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 1.5969356298446655,
	"min": 1.5406135320663452,
	"max": 3.2957420349121094,
	"count": 1000
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 32807.4453125,
	"min": 22233.03515625,
	"max": 119406.3984375,
	"count": 1000
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 52.81720430107527,
	"min": 40.56198347107438,
	"max": 999.0,
	"count": 1000
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19648.0,
	"min": 14076.0,
	"max": 23844.0,
	"count": 1000
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1555.4992597326595,
	"min": 1190.120050817967,
	"max": 1604.2552553318303,
	"count": 992
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 289322.8623102747,
	"min": 2394.009544151198,
	"max": 379028.06362600107,
	"count": 992
	},
	"SoccerTwos.Step.mean": {
	"value": 9999972.0,
	"min": 9174.0,
	"max": 9999972.0,
	"count": 1000
	},
	"SoccerTwos.Step.sum": {
	"value": 9999972.0,
	"min": 9174.0,
	"max": 9999972.0,
	"count": 1000
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": -0.014413188211619854,
	"min": -0.12347006052732468,
	"max": 0.12490702420473099,
	"count": 1000
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": -2.6664397716522217,
	"min": -24.955711364746094,
	"max": 17.15989875793457,
	"count": 1000
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.010898062027990818,
	"min": -0.12485354393720627,
	"max": 0.12470623850822449,
	"count": 1000
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": -2.016141414642334,
	"min": -24.727825164794922,
	"max": 16.87221908569336,
	"count": 1000
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 1000
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 1000
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": 0.13524540566109322,
	"min": -0.5605333337077388,
	"max": 0.41887500137090683,
	"count": 1000
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": 25.020400047302246,
	"min": -56.325600147247314,
	"max": 54.54360020160675,
	"count": 1000
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": 0.13524540566109322,
	"min": -0.5605333337077388,
	"max": 0.41887500137090683,
	"count": 1000
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": 25.020400047302246,
	"min": -56.325600147247314,
	"max": 54.54360020160675,
	"count": 1000
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 1000
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 1000
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.02141846805801227,
	"min": 0.010343785071745515,
	"max": 0.02435030248016119,
	"count": 482
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.02141846805801227,
	"min": 0.010343785071745515,
	"max": 0.02435030248016119,
	"count": 482
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.10125019202629724,
	"min": 0.00030965355545049534,
	"max": 0.12248869289954503,
	"count": 482
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.10125019202629724,
	"min": 0.00030965355545049534,
	"max": 0.12248869289954503,
	"count": 482
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.10259012083212535,
	"min": 0.00030871983423518635,
	"max": 0.12475258807341258,
	"count": 482
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.10259012083212535,
	"min": 0.00030871983423518635,
	"max": 0.12475258807341258,
	"count": 482
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 482
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 482
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 482
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 482
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 482
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 482
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1694708790",
	"python_version": "3.9.18 | packaged by conda-forge | (main, Aug 30 2023, 03:49:32) \n[GCC 12.3.0]",
	"command_line_arguments": "/home/terps/mambaforge/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1694736508"
	},
	"total": 27718.452107893998,
	"count": 1,
	"self": 1.7995216749986866,
	"children": {
	"run_training.setup": {
	"total": 0.012232699999003671,
	"count": 1,
	"self": 0.012232699999003671
	},
	"TrainerController.start_learning": {
	"total": 27716.640353519,
	"count": 1,
	"self": 19.2576742155361,
	"children": {
	"TrainerController._reset_env": {
	"total": 8.84835274298166,
	"count": 21,
	"self": 8.84835274298166
	},
	"TrainerController.advance": {
	"total": 27688.247795048483,
	"count": 680429,
	"self": 19.05893027050115,
	"children": {
	"env_step": {
	"total": 22157.30852160375,
	"count": 680429,
	"self": 15638.15256235451,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 6507.746948996195,
	"count": 680429,
	"self": 113.61552996908722,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 6394.131419027108,
	"count": 1254764,
	"self": 6394.131419027108
	}
	}
	},
	"workers": {
	"total": 11.40901025304629,
	"count": 680428,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 27672.763382924164,
	"count": 680428,
	"is_parallel": true,
	"self": 14029.47554577728,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.007280599998921389,
	"count": 2,
	"is_parallel": true,
	"self": 0.005340200004866347,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.001940399994055042,
	"count": 8,
	"is_parallel": true,
	"self": 0.001940399994055042
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.03416270000161603,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006320999964373186,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0005296000017551705,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005296000017551705
	},
	"communicator.exchange": {
	"total": 0.031072600002516992,
	"count": 1,
	"is_parallel": true,
	"self": 0.031072600002516992
	},
	"steps_from_proto": {
	"total": 0.0019284000009065494,
	"count": 2,
	"is_parallel": true,
	"self": 0.00048099999912665226,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0014474000017798971,
	"count": 8,
	"is_parallel": true,
	"self": 0.0014474000017798971
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 13643.25105359788,
	"count": 680427,
	"is_parallel": true,
	"self": 402.79831428049874,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 276.44210654751805,
	"count": 680427,
	"is_parallel": true,
	"self": 276.44210654751805
	},
	"communicator.exchange": {
	"total": 11742.215522667906,
	"count": 680427,
	"is_parallel": true,
	"self": 11742.215522667906
	},
	"steps_from_proto": {
	"total": 1221.795110101957,
	"count": 1360854,
	"is_parallel": true,
	"self": 273.6090259386874,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 948.1860841632697,
	"count": 5443416,
	"is_parallel": true,
	"self": 948.1860841632697
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.03678354900330305,
	"count": 40,
	"is_parallel": true,
	"self": 0.008402747000218369,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.028380802003084682,
	"count": 160,
	"is_parallel": true,
	"self": 0.028380802003084682
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 5511.880343174231,
	"count": 680428,
	"self": 128.80195408420332,
	"children": {
	"process_trajectory": {
	"total": 2575.0881813440137,
	"count": 680428,
	"self": 2568.601877004996,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 6.486304339017806,
	"count": 20,
	"self": 6.486304339017806
	}
	}
	},
	"_update_policy": {
	"total": 2807.9902077460138,
	"count": 483,
	"self": 1697.4578579989175,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 1110.5323497470963,
	"count": 14490,
	"self": 1110.5323497470963
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.5999976312741637e-06,
	"count": 1,
	"self": 1.5999976312741637e-06
	},
	"TrainerController._save_models": {
	"total": 0.28652991200215183,
	"count": 1,
	"self": 0.002179615003115032,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.2843502969990368,
	"count": 1,
	"self": 0.2843502969990368
	}
	}
	}
	}
	}
	}
	}