First push

5ca6bb6 verified 11 months ago

18.2 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.9925450086593628,
	"min": 0.9847832918167114,
	"max": 1.466425895690918,
	"count": 5
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 30316.294921875,
	"min": 29496.228515625,
	"max": 44485.49609375,
	"count": 5
	},
	"Pyramids.Step.mean": {
	"value": 149970.0,
	"min": 29952.0,
	"max": 149970.0,
	"count": 5
	},
	"Pyramids.Step.sum": {
	"value": 149970.0,
	"min": 29952.0,
	"max": 149970.0,
	"count": 5
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.11928949505090714,
	"min": -0.11928949505090714,
	"max": 0.007646649144589901,
	"count": 5
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": -28.748767852783203,
	"min": -28.748767852783203,
	"max": 1.812255859375,
	"count": 5
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.08848647773265839,
	"min": 0.08848647773265839,
	"max": 0.4663185477256775,
	"count": 5
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 21.325241088867188,
	"min": 21.325241088867188,
	"max": 110.51749420166016,
	"count": 5
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.07245683489965793,
	"min": 0.07033540763214483,
	"max": 0.07588012771551118,
	"count": 5
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.7970251838962372,
	"min": 0.5065388291637312,
	"max": 0.7970251838962372,
	"count": 5
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.0005877865855996381,
	"min": 0.0005877865855996381,
	"max": 0.009045908642764408,
	"count": 5
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.006465652441596019,
	"min": 0.00532774068794121,
	"max": 0.06332136049935086,
	"count": 5
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 0.00028655179539182723,
	"min": 0.00028655179539182723,
	"max": 0.00029838354339596195,
	"count": 5
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.0031520697493100996,
	"min": 0.0020691136102954665,
	"max": 0.0031520697493100996,
	"count": 5
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.19551726363636365,
	"min": 0.19551726363636365,
	"max": 0.19946118095238097,
	"count": 5
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 2.1506899,
	"min": 1.3897045333333333,
	"max": 2.1506899,
	"count": 5
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.009552174637272728,
	"min": 0.009552174637272728,
	"max": 0.009946171977142856,
	"count": 5
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.10507392101,
	"min": 0.06897148288,
	"max": 0.10507392101,
	"count": 5
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.0687025710940361,
	"min": 0.0687025710940361,
	"max": 0.45670634508132935,
	"count": 5
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.7557282447814941,
	"min": 0.7099942564964294,
	"max": 3.19694447517395,
	"count": 5
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 996.15625,
	"min": 984.40625,
	"max": 999.0,
	"count": 5
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 31877.0,
	"min": 15984.0,
	"max": 31968.0,
	"count": 5
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": -0.9346125507727265,
	"min": -1.0000000521540642,
	"max": -0.9228750506881624,
	"count": 5
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": -29.90760162472725,
	"min": -32.000001668930054,
	"max": -16.000000834465027,
	"count": 5
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": -0.9346125507727265,
	"min": -1.0000000521540642,
	"max": -0.9228750506881624,
	"count": 5
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": -29.90760162472725,
	"min": -32.000001668930054,
	"max": -16.000000834465027,
	"count": 5
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.7536459516268224,
	"min": 0.7536459516268224,
	"max": 8.610899567604065,
	"count": 5
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 24.116670452058315,
	"min": 24.116670452058315,
	"max": 137.77439308166504,
	"count": 5
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 5
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 5
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1748528443",
	"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "1.2.0.dev0",
	"mlagents_envs_version": "1.2.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.7.0+cu126",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1748528788"
	},
	"total": 344.56960941700004,
	"count": 1,
	"self": 0.5216151859999627,
	"children": {
	"run_training.setup": {
	"total": 0.021093043000064426,
	"count": 1,
	"self": 0.021093043000064426
	},
	"TrainerController.start_learning": {
	"total": 344.026901188,
	"count": 1,
	"self": 0.2570713980030632,
	"children": {
	"TrainerController._reset_env": {
	"total": 2.447821465000061,
	"count": 1,
	"self": 2.447821465000061
	},
	"TrainerController.advance": {
	"total": 340.9616144319971,
	"count": 9783,
	"self": 0.28863897802102656,
	"children": {
	"env_step": {
	"total": 228.421792245995,
	"count": 9783,
	"self": 200.272148808986,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 28.000657919996,
	"count": 9783,
	"self": 0.8493236969950431,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 27.15133422300096,
	"count": 9781,
	"self": 27.15133422300096
	}
	}
	},
	"workers": {
	"total": 0.14898551701298857,
	"count": 9782,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 342.82997307999176,
	"count": 9782,
	"is_parallel": true,
	"self": 162.237793356976,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0021176360000936256,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006946779999452701,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0014229580001483555,
	"count": 8,
	"is_parallel": true,
	"self": 0.0014229580001483555
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.05272724099995685,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006332640000437095,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0005856350001067767,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005856350001067767
	},
	"communicator.exchange": {
	"total": 0.04968257099994844,
	"count": 1,
	"is_parallel": true,
	"self": 0.04968257099994844
	},
	"steps_from_proto": {
	"total": 0.001825770999857923,
	"count": 1,
	"is_parallel": true,
	"self": 0.0004133489997002471,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.001412422000157676,
	"count": 8,
	"is_parallel": true,
	"self": 0.001412422000157676
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 180.59217972301576,
	"count": 9781,
	"is_parallel": true,
	"self": 5.447545174037259,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 4.101706276997675,
	"count": 9781,
	"is_parallel": true,
	"self": 4.101706276997675
	},
	"communicator.exchange": {
	"total": 154.1020959519915,
	"count": 9781,
	"is_parallel": true,
	"self": 154.1020959519915
	},
	"steps_from_proto": {
	"total": 16.94083231998934,
	"count": 9781,
	"is_parallel": true,
	"self": 3.5175229909548307,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 13.42330932903451,
	"count": 78248,
	"is_parallel": true,
	"self": 13.42330932903451
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 112.25118320798106,
	"count": 9782,
	"self": 0.3296399020075569,
	"children": {
	"process_trajectory": {
	"total": 21.554079229972558,
	"count": 9782,
	"self": 21.554079229972558
	},
	"_update_policy": {
	"total": 90.36746407600094,
	"count": 43,
	"self": 50.6577351279966,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 39.70972894800434,
	"count": 3597,
	"self": 39.70972894800434
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.2549999155453406e-06,
	"count": 1,
	"self": 1.2549999155453406e-06
	},
	"TrainerController._save_models": {
	"total": 0.36039263799989385,
	"count": 1,
	"self": 0.0037798139999267732,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.3566128239999671,
	"count": 1,
	"self": 0.3566128239999671
	}
	}
	}
	}
	}
	}
	}