First Push

2b4b864 verified about 2 years ago

18.4 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.599629819393158,
	"min": 0.5059385299682617,
	"max": 1.3475011587142944,
	"count": 10
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 18056.052734375,
	"min": 15234.8212890625,
	"max": 40877.796875,
	"count": 10
	},
	"Pyramids.Step.mean": {
	"value": 299937.0,
	"min": 29876.0,
	"max": 299937.0,
	"count": 10
	},
	"Pyramids.Step.sum": {
	"value": 299937.0,
	"min": 29876.0,
	"max": 299937.0,
	"count": 10
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.06407999992370605,
	"min": -0.08377300947904587,
	"max": 0.1260421872138977,
	"count": 10
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": -15.443279266357422,
	"min": -20.189294815063477,
	"max": 29.871997833251953,
	"count": 10
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.03486521169543266,
	"min": 0.03486521169543266,
	"max": 0.4703199863433838,
	"count": 10
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 8.40251636505127,
	"min": 8.40251636505127,
	"max": 111.46583557128906,
	"count": 10
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06665528073668651,
	"min": 0.0659730467887623,
	"max": 0.0708409442319011,
	"count": 10
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9331739303136112,
	"min": 0.5435417446077209,
	"max": 0.9760828728780373,
	"count": 10
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.0013290936716116725,
	"min": 0.0008538765170754994,
	"max": 0.007949723781564465,
	"count": 10
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.018607311402563415,
	"min": 0.010246518204905993,
	"max": 0.06359779025251572,
	"count": 10
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 1.573402332678572e-05,
	"min": 1.573402332678572e-05,
	"max": 0.00028281175572941665,
	"count": 10
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.00022027632657500005,
	"min": 0.00022027632657500005,
	"max": 0.003053585182138333,
	"count": 10
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10524464285714287,
	"min": 0.10524464285714287,
	"max": 0.19427058333333336,
	"count": 10
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4734250000000002,
	"min": 1.4734250000000002,
	"max": 2.217861666666667,
	"count": 10
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.0005339398214285715,
	"min": 0.0005339398214285715,
	"max": 0.009427631275,
	"count": 10
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.007475157500000001,
	"min": 0.007475157500000001,
	"max": 0.10180438049999999,
	"count": 10
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.0322943739593029,
	"min": 0.0322943739593029,
	"max": 0.5086736083030701,
	"count": 10
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.45212122797966003,
	"min": 0.45212122797966003,
	"max": 4.0693888664245605,
	"count": 10
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 982.6666666666666,
	"min": 906.5714285714286,
	"max": 998.2666666666667,
	"count": 10
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 32428.0,
	"min": 17186.0,
	"max": 33298.0,
	"count": 10
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": -0.8620970204020991,
	"min": -0.9324333834151427,
	"max": -0.47850004583597183,
	"count": 10
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": -28.449201673269272,
	"min": -29.327601686120033,
	"max": -13.202000856399536,
	"count": 10
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": -0.8620970204020991,
	"min": -0.9324333834151427,
	"max": -0.47850004583597183,
	"count": 10
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": -28.449201673269272,
	"min": -29.327601686120033,
	"max": -13.202000856399536,
	"count": 10
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.3238650124068513,
	"min": 0.3238650124068513,
	"max": 9.837597578763962,
	"count": 10
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 10.687545409426093,
	"min": 10.11720191128552,
	"max": 177.0767564177513,
	"count": 10
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 10
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 10
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1710323913",
	"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "1.1.0.dev0",
	"mlagents_envs_version": "1.1.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.2.1+cu121",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1710324533"
	},
	"total": 620.057915522,
	"count": 1,
	"self": 0.4871585920000143,
	"children": {
	"run_training.setup": {
	"total": 0.049293196999997235,
	"count": 1,
	"self": 0.049293196999997235
	},
	"TrainerController.start_learning": {
	"total": 619.521463733,
	"count": 1,
	"self": 0.3832185879816734,
	"children": {
	"TrainerController._reset_env": {
	"total": 2.2970554870000797,
	"count": 1,
	"self": 2.2970554870000797
	},
	"TrainerController.advance": {
	"total": 616.7305033180185,
	"count": 18939,
	"self": 0.4071372580162915,
	"children": {
	"env_step": {
	"total": 434.62161004100517,
	"count": 18939,
	"self": 394.4325869120273,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 39.93781932799084,
	"count": 18939,
	"self": 1.419481331971383,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 38.518337996019454,
	"count": 18801,
	"self": 38.518337996019454
	}
	}
	},
	"workers": {
	"total": 0.2512038009870139,
	"count": 18939,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 617.9181912310048,
	"count": 18939,
	"is_parallel": true,
	"self": 259.496082748002,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0021149589999822638,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006936429997494997,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.001421316000232764,
	"count": 8,
	"is_parallel": true,
	"self": 0.001421316000232764
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.11306079400014823,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006469720003678958,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.00048515499997847655,
	"count": 1,
	"is_parallel": true,
	"self": 0.00048515499997847655
	},
	"communicator.exchange": {
	"total": 0.11005449299977954,
	"count": 1,
	"is_parallel": true,
	"self": 0.11005449299977954
	},
	"steps_from_proto": {
	"total": 0.0018741740000223217,
	"count": 1,
	"is_parallel": true,
	"self": 0.0004333500000939239,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0014408239999283978,
	"count": 8,
	"is_parallel": true,
	"self": 0.0014408239999283978
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 358.42210848300283,
	"count": 18938,
	"is_parallel": true,
	"self": 10.17915077599082,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 7.354304913994156,
	"count": 18938,
	"is_parallel": true,
	"self": 7.354304913994156
	},
	"communicator.exchange": {
	"total": 310.45844801000817,
	"count": 18938,
	"is_parallel": true,
	"self": 310.45844801000817
	},
	"steps_from_proto": {
	"total": 30.430204783009685,
	"count": 18938,
	"is_parallel": true,
	"self": 6.190673180028625,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 24.23953160298106,
	"count": 151504,
	"is_parallel": true,
	"self": 24.23953160298106
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 181.701756018997,
	"count": 18939,
	"self": 0.6548334029737362,
	"children": {
	"process_trajectory": {
	"total": 37.35671043802154,
	"count": 18939,
	"self": 37.35671043802154
	},
	"_update_policy": {
	"total": 143.69021217800173,
	"count": 127,
	"self": 83.25335949400755,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 60.436852683994175,
	"count": 6825,
	"self": 60.436852683994175
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.2549999155453406e-06,
	"count": 1,
	"self": 1.2549999155453406e-06
	},
	"TrainerController._save_models": {
	"total": 0.11068508499988639,
	"count": 1,
	"self": 0.001532421999854705,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.10915266300003168,
	"count": 1,
	"self": 0.10915266300003168
	}
	}
	}
	}
	}
	}
	}