First push

e216770 verified about 1 year ago

18.7 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.323770672082901,
	"min": 0.323770672082901,
	"max": 1.4582098722457886,
	"count": 33
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 9759.7431640625,
	"min": 9759.7431640625,
	"max": 44236.25390625,
	"count": 33
	},
	"Pyramids.Step.mean": {
	"value": 989895.0,
	"min": 29915.0,
	"max": 989895.0,
	"count": 33
	},
	"Pyramids.Step.sum": {
	"value": 989895.0,
	"min": 29915.0,
	"max": 989895.0,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.49555015563964844,
	"min": -0.13686437904834747,
	"max": 0.6415801048278809,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 130.8252410888672,
	"min": -32.57372283935547,
	"max": 181.56716918945312,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": -0.011162635870277882,
	"min": -0.011162635870277882,
	"max": 0.26784929633140564,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": -2.9469358921051025,
	"min": -2.9469358921051025,
	"max": 64.55168151855469,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06477152436143821,
	"min": 0.06477152436143821,
	"max": 0.07273734795738009,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9715728654215732,
	"min": 0.5766963413077729,
	"max": 1.0643582190021728,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.01423398255525778,
	"min": 0.0005055835248906022,
	"max": 0.015414487217833889,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.2135097383288667,
	"min": 0.006067002298687226,
	"max": 0.21986013003333937,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 7.521337492920005e-06,
	"min": 7.521337492920005e-06,
	"max": 0.0002948502392165875,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.00011282006239380008,
	"min": 0.00011282006239380008,
	"max": 0.003508413530528899,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10250708000000001,
	"min": 0.10250708000000001,
	"max": 0.1982834125,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.5376062000000001,
	"min": 1.4776548,
	"max": 2.5694710999999995,
	"count": 33
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.00026045729200000015,
	"min": 0.00026045729200000015,
	"max": 0.00982851290875,
	"count": 33
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.003906859380000002,
	"min": 0.003906859380000002,
	"max": 0.11697016289000002,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.01812346652150154,
	"min": 0.01812346652150154,
	"max": 0.4680212736129761,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.2718519866466522,
	"min": 0.2669598162174225,
	"max": 3.7441701889038086,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 389.17283950617286,
	"min": 336.96774193548384,
	"max": 999.0,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 31523.0,
	"min": 16969.0,
	"max": 32699.0,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.4132493548555138,
	"min": -0.9999500517733395,
	"max": 1.571856159172701,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 114.47319774329662,
	"min": -31.998401656746864,
	"max": 144.65899857878685,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.4132493548555138,
	"min": -0.9999500517733395,
	"max": 1.571856159172701,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 114.47319774329662,
	"min": -31.998401656746864,
	"max": 144.65899857878685,
	"count": 33
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.07258195938962156,
	"min": 0.06830586166168222,
	"max": 8.162659615278244,
	"count": 33
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 5.879138710559346,
	"min": 5.396163071272895,
	"max": 146.9278730750084,
	"count": 33
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1738450332",
	"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "1.2.0.dev0",
	"mlagents_envs_version": "1.2.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.6.0+cu124",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1738452704"
	},
	"total": 2371.3287003059995,
	"count": 1,
	"self": 0.5264948510002796,
	"children": {
	"run_training.setup": {
	"total": 0.030683930999657605,
	"count": 1,
	"self": 0.030683930999657605
	},
	"TrainerController.start_learning": {
	"total": 2370.7715215239996,
	"count": 1,
	"self": 1.481143858023188,
	"children": {
	"TrainerController._reset_env": {
	"total": 2.244592248999652,
	"count": 1,
	"self": 2.244592248999652
	},
	"TrainerController.advance": {
	"total": 2366.951290260977,
	"count": 63824,
	"self": 1.5431029529468105,
	"children": {
	"env_step": {
	"total": 1648.2647548129257,
	"count": 63824,
	"self": 1479.8927231679654,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 167.49660390002782,
	"count": 63824,
	"self": 5.003764071965179,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 162.49283982806264,
	"count": 62557,
	"self": 162.49283982806264
	}
	}
	},
	"workers": {
	"total": 0.8754277449324945,
	"count": 63824,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2365.041919946991,
	"count": 63824,
	"is_parallel": true,
	"self": 1008.47313007404,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.002063453999653575,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006883389992253797,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0013751150004281953,
	"count": 8,
	"is_parallel": true,
	"self": 0.0013751150004281953
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.052112123999904725,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005389189996094501,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0007047650001368311,
	"count": 1,
	"is_parallel": true,
	"self": 0.0007047650001368311
	},
	"communicator.exchange": {
	"total": 0.04913821300033305,
	"count": 1,
	"is_parallel": true,
	"self": 0.04913821300033305
	},
	"steps_from_proto": {
	"total": 0.0017302269998253905,
	"count": 1,
	"is_parallel": true,
	"self": 0.00035096299961878685,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0013792640002066037,
	"count": 8,
	"is_parallel": true,
	"self": 0.0013792640002066037
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1356.5687898729511,
	"count": 63823,
	"is_parallel": true,
	"self": 33.35161664508223,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 24.426625246936965,
	"count": 63823,
	"is_parallel": true,
	"self": 24.426625246936965
	},
	"communicator.exchange": {
	"total": 1195.464377916011,
	"count": 63823,
	"is_parallel": true,
	"self": 1195.464377916011
	},
	"steps_from_proto": {
	"total": 103.32617006492092,
	"count": 63823,
	"is_parallel": true,
	"self": 20.968925834036327,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 82.35724423088459,
	"count": 510584,
	"is_parallel": true,
	"self": 82.35724423088459
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 717.1434324951047,
	"count": 63824,
	"self": 2.8409659511489735,
	"children": {
	"process_trajectory": {
	"total": 139.40505516995745,
	"count": 63824,
	"self": 139.19528470095793,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.20977046899952256,
	"count": 2,
	"self": 0.20977046899952256
	}
	}
	},
	"_update_policy": {
	"total": 574.8974113739982,
	"count": 456,
	"self": 316.4368406340377,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 258.46057073996053,
	"count": 22773,
	"self": 258.46057073996053
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.1829997674794868e-06,
	"count": 1,
	"self": 1.1829997674794868e-06
	},
	"TrainerController._save_models": {
	"total": 0.09449397299977136,
	"count": 1,
	"self": 0.0014072179992581368,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.09308675500051322,
	"count": 1,
	"self": 0.09308675500051322
	}
	}
	}
	}
	}
	}
	}