First Push

7c04eac verified 9 months ago

18.7 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.1700698733329773,
	"min": 0.15845796465873718,
	"max": 0.26031944155693054,
	"count": 28
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 5161.9609375,
	"min": 1016.287109375,
	"max": 7826.34375,
	"count": 28
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 207.768115942029,
	"min": 175.07692307692307,
	"max": 271.4117647058824,
	"count": 28
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 28672.0,
	"min": 2276.0,
	"max": 32298.0,
	"count": 28
	},
	"Pyramids.Step.mean": {
	"value": 2489948.0,
	"min": 1679960.0,
	"max": 2489948.0,
	"count": 28
	},
	"Pyramids.Step.sum": {
	"value": 2489948.0,
	"min": 1679960.0,
	"max": 2489948.0,
	"count": 28
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.9037383794784546,
	"min": 0.6263155341148376,
	"max": 0.9037383794784546,
	"count": 28
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 273.8327331542969,
	"min": 17.536834716796875,
	"max": 273.8327331542969,
	"count": 28
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.0044550965540111065,
	"min": -0.002209288766607642,
	"max": 0.046209245920181274,
	"count": 28
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 1.3498942852020264,
	"min": -0.6451123356819153,
	"max": 13.90898323059082,
	"count": 28
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.7777376668392748,
	"min": 1.6613411556522386,
	"max": 1.8249230568225567,
	"count": 28
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 245.32779802381992,
	"min": 23.723999738693237,
	"max": 252.7247984930873,
	"count": 28
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.7777376668392748,
	"min": 1.6613411556522386,
	"max": 1.8249230568225567,
	"count": 28
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 245.32779802381992,
	"min": 23.723999738693237,
	"max": 252.7247984930873,
	"count": 28
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.011585179078858768,
	"min": 0.011585179078858768,
	"max": 0.01712447010917674,
	"count": 28
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 1.59875471288251,
	"min": 0.16541378060355783,
	"max": 2.061749845990562,
	"count": 28
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06791332284670457,
	"min": 0.06540743341627538,
	"max": 0.0716755648241988,
	"count": 28
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.950786519853864,
	"min": 0.06915688141210315,
	"max": 1.0671006890382462,
	"count": 28
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.012159144297280971,
	"min": 0.011192417538647229,
	"max": 0.01619531853343471,
	"count": 28
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.17022802016193359,
	"min": 0.011192417538647229,
	"max": 0.23043314945243767,
	"count": 28
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 5.244986108816905e-05,
	"min": 5.244986108816905e-05,
	"max": 0.0001321056559648,
	"count": 28
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.0007342980552343667,
	"min": 0.0001321056559648,
	"max": 0.0018678535773824336,
	"count": 28
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.11748325952380953,
	"min": 0.11748325952380953,
	"max": 0.1440352,
	"count": 28
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.6447656333333334,
	"min": 0.1440352,
	"max": 2.1226175666666665,
	"count": 28
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.0017565776264285714,
	"min": 0.0017565776264285714,
	"max": 0.004409116479999999,
	"count": 28
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.02459208677,
	"min": 0.004409116479999999,
	"max": 0.062349494910000004,
	"count": 28
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.005485209170728922,
	"min": 0.005394092295318842,
	"max": 0.006814947817474604,
	"count": 28
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.07679292559623718,
	"min": 0.006814947817474604,
	"max": 0.09431394934654236,
	"count": 28
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 28
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 28
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1752607676",
	"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics --resume",
	"mlagents_version": "1.2.0.dev0",
	"mlagents_envs_version": "1.2.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.7.1+cu126",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1752611128"
	},
	"total": 3452.413145898001,
	"count": 1,
	"self": 1.141851158999998,
	"children": {
	"run_training.setup": {
	"total": 0.04782425800112833,
	"count": 1,
	"self": 0.04782425800112833
	},
	"TrainerController.start_learning": {
	"total": 3451.223470481,
	"count": 1,
	"self": 2.3732128570936766,
	"children": {
	"TrainerController._reset_env": {
	"total": 3.8553263949997927,
	"count": 1,
	"self": 3.8553263949997927
	},
	"TrainerController.advance": {
	"total": 3444.985487246906,
	"count": 54374,
	"self": 2.6153873088951514,
	"children": {
	"env_step": {
	"total": 2473.174419440069,
	"count": 54374,
	"self": 2323.5796925855357,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 148.17614540590876,
	"count": 54374,
	"self": 6.909613850857568,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 141.2665315550512,
	"count": 51630,
	"self": 141.2665315550512
	}
	}
	},
	"workers": {
	"total": 1.4185814486245363,
	"count": 54374,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 3442.0139552039436,
	"count": 54374,
	"is_parallel": true,
	"self": 1292.3154535910217,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0032977760001813294,
	"count": 1,
	"is_parallel": true,
	"self": 0.0009555380001984304,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.002342237999982899,
	"count": 8,
	"is_parallel": true,
	"self": 0.002342237999982899
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.07654789699881803,
	"count": 1,
	"is_parallel": true,
	"self": 0.0007555769989266992,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0006237380002858117,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006237380002858117
	},
	"communicator.exchange": {
	"total": 0.07307490799939842,
	"count": 1,
	"is_parallel": true,
	"self": 0.07307490799939842
	},
	"steps_from_proto": {
	"total": 0.002093674000207102,
	"count": 1,
	"is_parallel": true,
	"self": 0.0004639890030375682,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0016296849971695337,
	"count": 8,
	"is_parallel": true,
	"self": 0.0016296849971695337
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 2149.698501612922,
	"count": 54373,
	"is_parallel": true,
	"self": 41.98684660366598,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 28.251620290124265,
	"count": 54373,
	"is_parallel": true,
	"self": 28.251620290124265
	},
	"communicator.exchange": {
	"total": 1962.164245098813,
	"count": 54373,
	"is_parallel": true,
	"self": 1962.164245098813
	},
	"steps_from_proto": {
	"total": 117.29578962031883,
	"count": 54373,
	"is_parallel": true,
	"self": 26.28809506757716,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 91.00769455274167,
	"count": 434984,
	"is_parallel": true,
	"self": 91.00769455274167
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 969.1956804979418,
	"count": 54374,
	"self": 5.1387520592816145,
	"children": {
	"process_trajectory": {
	"total": 159.55085079067612,
	"count": 54374,
	"self": 159.33494666267688,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.21590412799923797,
	"count": 2,
	"self": 0.21590412799923797
	}
	}
	},
	"_update_policy": {
	"total": 804.5060776479841,
	"count": 390,
	"self": 317.23073637292146,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 487.2753412750626,
	"count": 18758,
	"self": 487.2753412750626
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.8539994925959036e-06,
	"count": 1,
	"self": 1.8539994925959036e-06
	},
	"TrainerController._save_models": {
	"total": 0.009442128000955563,
	"count": 1,
	"self": 6.396600110747386e-05,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.00937816199984809,
	"count": 1,
	"self": 0.00937816199984809
	}
	}
	}
	}
	}
	}
	}