First Push

628a0a5 verified 2 months ago

18.8 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.15419848263263702,
	"min": 0.13651002943515778,
	"max": 0.823553740978241,
	"count": 80
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 4633.35595703125,
	"min": 3663.1669921875,
	"max": 24707.591796875,
	"count": 80
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 214.79136690647482,
	"min": 138.16666666666666,
	"max": 489.51666666666665,
	"count": 80
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 29856.0,
	"min": 829.0,
	"max": 31776.0,
	"count": 80
	},
	"Pyramids.Step.mean": {
	"value": 2999909.0,
	"min": 629931.0,
	"max": 2999909.0,
	"count": 80
	},
	"Pyramids.Step.sum": {
	"value": 2999909.0,
	"min": 629931.0,
	"max": 2999909.0,
	"count": 80
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.8359577655792236,
	"min": 0.25308457016944885,
	"max": 0.8370456695556641,
	"count": 80
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 248.27944946289062,
	"min": 8.604875564575195,
	"max": 252.99343872070312,
	"count": 80
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.005533040966838598,
	"min": -0.01403752900660038,
	"max": 0.024144239723682404,
	"count": 80
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 1.6433131694793701,
	"min": -4.028770923614502,
	"max": 6.905252456665039,
	"count": 80
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.7708172537654423,
	"min": 1.410446641842524,
	"max": 1.8618333041667938,
	"count": 80
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 246.1435982733965,
	"min": 11.170999825000763,
	"max": 246.1435982733965,
	"count": 80
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.7708172537654423,
	"min": 1.410446641842524,
	"max": 1.8618333041667938,
	"count": 80
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 246.1435982733965,
	"min": 11.170999825000763,
	"max": 246.1435982733965,
	"count": 80
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.016907050741648826,
	"min": 0.014792351323800782,
	"max": 0.044656114225896694,
	"count": 80
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 2.3500800530891865,
	"min": 0.0887541079428047,
	"max": 2.9113981585251167,
	"count": 80
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06731645511844814,
	"min": 0.06449578986689057,
	"max": 0.07284202956153811,
	"count": 80
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9424303716582739,
	"min": 0.06511365686310455,
	"max": 1.060511664133325,
	"count": 80
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.015762173018168138,
	"min": 0.007312449966169273,
	"max": 0.016672092985356272,
	"count": 80
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.22067042225435393,
	"min": 0.007312449966169273,
	"max": 0.24920289873261936,
	"count": 80
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 1.4407423769285715e-06,
	"min": 1.4407423769285715e-06,
	"max": 0.00023719272093576668,
	"count": 80
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 2.0170393277e-05,
	"min": 2.0170393277e-05,
	"max": 0.0035325708224765,
	"count": 80
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10048021428571428,
	"min": 0.10048021428571428,
	"max": 0.17906423333333335,
	"count": 80
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.406723,
	"min": 0.17906423333333335,
	"max": 2.6775235000000004,
	"count": 80
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 5.797340714285716e-05,
	"min": 5.797340714285716e-05,
	"max": 0.007908516909999998,
	"count": 80
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.0008116277000000002,
	"min": 0.0008116277000000002,
	"max": 0.11778459765000002,
	"count": 80
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.0075660645961761475,
	"min": 0.007331254426389933,
	"max": 0.009189439006149769,
	"count": 80
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.10592490434646606,
	"min": 0.008900578133761883,
	"max": 0.1329563856124878,
	"count": 80
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 80
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 80
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1726695630",
	"python_version": "3.10.12 (main, Sep 11 2024, 15:47:36) [GCC 11.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --resume --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "1.1.0.dev0",
	"mlagents_envs_version": "1.1.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.4.0+cu121",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1726704165"
	},
	"total": 8535.375619375,
	"count": 1,
	"self": 0.7452478820014221,
	"children": {
	"run_training.setup": {
	"total": 0.08237167299967041,
	"count": 1,
	"self": 0.08237167299967041
	},
	"TrainerController.start_learning": {
	"total": 8534.547999819999,
	"count": 1,
	"self": 6.145169671061012,
	"children": {
	"TrainerController._reset_env": {
	"total": 3.3979853539999567,
	"count": 1,
	"self": 3.3979853539999567
	},
	"TrainerController.advance": {
	"total": 8524.909182714937,
	"count": 155171,
	"self": 6.299874070782607,
	"children": {
	"env_step": {
	"total": 5955.887078486949,
	"count": 155171,
	"self": 5576.892458963869,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 375.4418779521029,
	"count": 155171,
	"self": 18.163601917177402,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 357.2782760349255,
	"count": 148435,
	"self": 357.2782760349255
	}
	}
	},
	"workers": {
	"total": 3.55274157097665,
	"count": 155171,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 8515.977976790391,
	"count": 155171,
	"is_parallel": true,
	"self": 3398.8017618879967,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.003266829000040161,
	"count": 1,
	"is_parallel": true,
	"self": 0.001071900000624737,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.002194928999415424,
	"count": 8,
	"is_parallel": true,
	"self": 0.002194928999415424
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.06434809599977598,
	"count": 1,
	"is_parallel": true,
	"self": 0.0008171239992407209,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0004978870001650648,
	"count": 1,
	"is_parallel": true,
	"self": 0.0004978870001650648
	},
	"communicator.exchange": {
	"total": 0.060996758000328555,
	"count": 1,
	"is_parallel": true,
	"self": 0.060996758000328555
	},
	"steps_from_proto": {
	"total": 0.002036327000041638,
	"count": 1,
	"is_parallel": true,
	"self": 0.00041612399991208804,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0016202030001295498,
	"count": 8,
	"is_parallel": true,
	"self": 0.0016202030001295498
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 5117.176214902394,
	"count": 155170,
	"is_parallel": true,
	"self": 120.9194205134263,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 72.63085866806523,
	"count": 155170,
	"is_parallel": true,
	"self": 72.63085866806523
	},
	"communicator.exchange": {
	"total": 4615.281839628038,
	"count": 155170,
	"is_parallel": true,
	"self": 4615.281839628038
	},
	"steps_from_proto": {
	"total": 308.34409609286513,
	"count": 155170,
	"is_parallel": true,
	"self": 68.52710665787299,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 239.81698943499214,
	"count": 1241360,
	"is_parallel": true,
	"self": 239.81698943499214
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 2562.7222301572065,
	"count": 155171,
	"self": 12.20619110042071,
	"children": {
	"process_trajectory": {
	"total": 410.9088252297897,
	"count": 155171,
	"self": 410.3971786137881,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.5116466160015989,
	"count": 5,
	"self": 0.5116466160015989
	}
	}
	},
	"_update_policy": {
	"total": 2139.607213826996,
	"count": 1124,
	"self": 857.109888902974,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 1282.497324924022,
	"count": 54069,
	"self": 1282.497324924022
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.2420005077729002e-06,
	"count": 1,
	"self": 1.2420005077729002e-06
	},
	"TrainerController._save_models": {
	"total": 0.09566083800018532,
	"count": 1,
	"self": 0.0034099340009561274,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.0922509039992292,
	"count": 1,
	"self": 0.0922509039992292
	}
	}
	}
	}
	}
	}
	}