Pyramids first push

6442d27 over 2 years ago

18.8 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.29915913939476013,
	"min": 0.28410860896110535,
	"max": 1.5636372566223145,
	"count": 50
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 8879.04296875,
	"min": 8564.169921875,
	"max": 47434.5,
	"count": 50
	},
	"Pyramids.Step.mean": {
	"value": 1499986.0,
	"min": 29952.0,
	"max": 1499986.0,
	"count": 50
	},
	"Pyramids.Step.sum": {
	"value": 1499986.0,
	"min": 29952.0,
	"max": 1499986.0,
	"count": 50
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.6056761145591736,
	"min": -0.09941365569829941,
	"max": 0.70343017578125,
	"count": 50
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 171.40634155273438,
	"min": -23.859277725219727,
	"max": 203.29132080078125,
	"count": 50
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.029083063825964928,
	"min": -0.05323021486401558,
	"max": 0.046292513608932495,
	"count": 50
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 8.230506896972656,
	"min": -12.615560531616211,
	"max": 11.156496047973633,
	"count": 50
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06749800125059362,
	"min": 0.0645788092425348,
	"max": 0.07387033428642012,
	"count": 50
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9449720175083106,
	"min": 0.5122415571954924,
	"max": 1.0787357757867808,
	"count": 50
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.01635693196329244,
	"min": 5.1410141096389446e-05,
	"max": 0.018066525813386157,
	"count": 50
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.22899704748609415,
	"min": 0.0006683318342530628,
	"max": 0.2529313613874062,
	"count": 50
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 2.920927597819051e-06,
	"min": 2.920927597819051e-06,
	"max": 0.00029676708679192377,
	"count": 50
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 4.0892986369466716e-05,
	"min": 4.0892986369466716e-05,
	"max": 0.0033499776833407994,
	"count": 50
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10097360952380953,
	"min": 0.10097360952380953,
	"max": 0.19892236190476195,
	"count": 50
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4136305333333334,
	"min": 1.3924565333333336,
	"max": 2.4779453999999994,
	"count": 50
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.00010726359142857153,
	"min": 0.00010726359142857153,
	"max": 0.009892343954285714,
	"count": 50
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.0015016902800000015,
	"min": 0.0015016902800000015,
	"max": 0.11167425408,
	"count": 50
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.003088225843384862,
	"min": 0.003088225843384862,
	"max": 0.08980808407068253,
	"count": 50
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.043235160410404205,
	"min": 0.043235160410404205,
	"max": 0.6286565661430359,
	"count": 50
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 294.61052631578946,
	"min": 260.6371681415929,
	"max": 999.0,
	"count": 50
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 27988.0,
	"min": 15984.0,
	"max": 32331.0,
	"count": 50
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.6632673507458284,
	"min": -1.0000000521540642,
	"max": 1.7258411051235467,
	"count": 50
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 158.0103983208537,
	"min": -31.99920167028904,
	"max": 192.54659831523895,
	"count": 50
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.6632673507458284,
	"min": -1.0000000521540642,
	"max": 1.7258411051235467,
	"count": 50
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 158.0103983208537,
	"min": -31.99920167028904,
	"max": 192.54659831523895,
	"count": 50
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.00949731385720186,
	"min": 0.00925837562298294,
	"max": 2.0735077019780874,
	"count": 50
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 0.9022448164341768,
	"min": 0.9022448164341768,
	"max": 33.1761232316494,
	"count": 50
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 50
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 50
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1692519392",
	"python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training 2 --no-graphics",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1692522895"
	},
	"total": 3502.9596972140007,
	"count": 1,
	"self": 0.47587667900006636,
	"children": {
	"run_training.setup": {
	"total": 0.03943244499987486,
	"count": 1,
	"self": 0.03943244499987486
	},
	"TrainerController.start_learning": {
	"total": 3502.4443880900008,
	"count": 1,
	"self": 2.1719298980442545,
	"children": {
	"TrainerController._reset_env": {
	"total": 3.9438994219999586,
	"count": 1,
	"self": 3.9438994219999586
	},
	"TrainerController.advance": {
	"total": 3496.227934853957,
	"count": 96019,
	"self": 2.1923658319446986,
	"children": {
	"env_step": {
	"total": 2496.282318781954,
	"count": 96019,
	"self": 2323.6505030061444,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 171.34090609513623,
	"count": 96019,
	"self": 7.490892098382574,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 163.85001399675366,
	"count": 93816,
	"self": 163.85001399675366
	}
	}
	},
	"workers": {
	"total": 1.2909096806733942,
	"count": 96019,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 3494.2376615598205,
	"count": 96019,
	"is_parallel": true,
	"self": 1354.1216041257712,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0019422639998083469,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006881150011395221,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0012541489986688248,
	"count": 8,
	"is_parallel": true,
	"self": 0.0012541489986688248
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.05570035900018411,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006343960003505345,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0006096659999457188,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006096659999457188
	},
	"communicator.exchange": {
	"total": 0.05234674700022879,
	"count": 1,
	"is_parallel": true,
	"self": 0.05234674700022879
	},
	"steps_from_proto": {
	"total": 0.002109549999659066,
	"count": 1,
	"is_parallel": true,
	"self": 0.0004419409997353796,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0016676089999236865,
	"count": 8,
	"is_parallel": true,
	"self": 0.0016676089999236865
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 2140.1160574340493,
	"count": 96018,
	"is_parallel": true,
	"self": 52.06851173504401,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 36.57885612815335,
	"count": 96018,
	"is_parallel": true,
	"self": 36.57885612815335
	},
	"communicator.exchange": {
	"total": 1881.6948344339062,
	"count": 96018,
	"is_parallel": true,
	"self": 1881.6948344339062
	},
	"steps_from_proto": {
	"total": 169.7738551369457,
	"count": 96018,
	"is_parallel": true,
	"self": 34.172791839220736,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 135.60106329772498,
	"count": 768144,
	"is_parallel": true,
	"self": 135.60106329772498
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 997.7532502400582,
	"count": 96019,
	"self": 4.0224143680216,
	"children": {
	"process_trajectory": {
	"total": 174.90187697804777,
	"count": 96019,
	"self": 174.59119515204748,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.31068182600029104,
	"count": 3,
	"self": 0.31068182600029104
	}
	}
	},
	"_update_policy": {
	"total": 818.8289588939888,
	"count": 675,
	"self": 536.3215708619209,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 282.50738803206787,
	"count": 34212,
	"self": 282.50738803206787
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.0139992809854448e-06,
	"count": 1,
	"self": 1.0139992809854448e-06
	},
	"TrainerController._save_models": {
	"total": 0.1006229020003957,
	"count": 1,
	"self": 0.0015464750013052253,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.09907642699909047,
	"count": 1,
	"self": 0.09907642699909047
	}
	}
	}
	}
	}
	}
	}