| { |
| "name": "root", |
| "gauges": { |
| "Pyramids.Policy.Entropy.mean": { |
| "value": 0.20883840322494507, |
| "min": 0.19934269785881042, |
| "max": 1.4834659099578857, |
| "count": 100 |
| }, |
| "Pyramids.Policy.Entropy.sum": { |
| "value": 6305.2490234375, |
| "min": 5968.60498046875, |
| "max": 45002.421875, |
| "count": 100 |
| }, |
| "Pyramids.Step.mean": { |
| "value": 2999875.0, |
| "min": 29952.0, |
| "max": 2999875.0, |
| "count": 100 |
| }, |
| "Pyramids.Step.sum": { |
| "value": 2999875.0, |
| "min": 29952.0, |
| "max": 2999875.0, |
| "count": 100 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
| "value": 0.798509418964386, |
| "min": -0.08498506247997284, |
| "max": 0.8286927938461304, |
| "count": 100 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
| "value": 242.7468719482422, |
| "min": -20.56638526916504, |
| "max": 249.4365234375, |
| "count": 100 |
| }, |
| "Pyramids.Policy.RndValueEstimate.mean": { |
| "value": 0.00782564003020525, |
| "min": -0.02389027550816536, |
| "max": 0.3482888638973236, |
| "count": 100 |
| }, |
| "Pyramids.Policy.RndValueEstimate.sum": { |
| "value": 2.3789947032928467, |
| "min": -6.2114715576171875, |
| "max": 83.58932495117188, |
| "count": 100 |
| }, |
| "Pyramids.Losses.PolicyLoss.mean": { |
| "value": 0.0685256353345245, |
| "min": 0.06373710363663525, |
| "max": 0.07483905499980742, |
| "count": 100 |
| }, |
| "Pyramids.Losses.PolicyLoss.sum": { |
| "value": 0.9593588946833431, |
| "min": 0.48028539652994195, |
| "max": 1.1069516701362434, |
| "count": 100 |
| }, |
| "Pyramids.Losses.ValueLoss.mean": { |
| "value": 0.015294011145929936, |
| "min": 0.000883022911804011, |
| "max": 0.016372764399125182, |
| "count": 100 |
| }, |
| "Pyramids.Losses.ValueLoss.sum": { |
| "value": 0.21411615604301912, |
| "min": 0.010596274941648132, |
| "max": 0.233787051406027, |
| "count": 100 |
| }, |
| "Pyramids.Policy.LearningRate.mean": { |
| "value": 1.506463783592856e-06, |
| "min": 1.506463783592856e-06, |
| "max": 0.00029838354339596195, |
| "count": 100 |
| }, |
| "Pyramids.Policy.LearningRate.sum": { |
| "value": 2.1090492970299984e-05, |
| "min": 2.1090492970299984e-05, |
| "max": 0.004072358742547132, |
| "count": 100 |
| }, |
| "Pyramids.Policy.Epsilon.mean": { |
| "value": 0.10050212142857143, |
| "min": 0.10050212142857143, |
| "max": 0.19946118095238097, |
| "count": 100 |
| }, |
| "Pyramids.Policy.Epsilon.sum": { |
| "value": 1.4070297, |
| "min": 1.3897045333333333, |
| "max": 2.8574528666666668, |
| "count": 100 |
| }, |
| "Pyramids.Policy.Beta.mean": { |
| "value": 6.016193071428568e-05, |
| "min": 6.016193071428568e-05, |
| "max": 0.009946171977142856, |
| "count": 100 |
| }, |
| "Pyramids.Policy.Beta.sum": { |
| "value": 0.0008422670299999995, |
| "min": 0.0008422670299999995, |
| "max": 0.13575954138, |
| "count": 100 |
| }, |
| "Pyramids.Losses.RNDLoss.mean": { |
| "value": 0.004812297411262989, |
| "min": 0.004657533951103687, |
| "max": 0.5557369589805603, |
| "count": 100 |
| }, |
| "Pyramids.Losses.RNDLoss.sum": { |
| "value": 0.067372165620327, |
| "min": 0.06520547717809677, |
| "max": 3.8901588916778564, |
| "count": 100 |
| }, |
| "Pyramids.Environment.EpisodeLength.mean": { |
| "value": 249.46031746031747, |
| "min": 213.3014705882353, |
| "max": 999.0, |
| "count": 100 |
| }, |
| "Pyramids.Environment.EpisodeLength.sum": { |
| "value": 31432.0, |
| "min": 15984.0, |
| "max": 32312.0, |
| "count": 100 |
| }, |
| "Pyramids.Environment.CumulativeReward.mean": { |
| "value": 1.7187904574804835, |
| "min": -1.0000000521540642, |
| "max": 1.7798248023664864, |
| "count": 100 |
| }, |
| "Pyramids.Environment.CumulativeReward.sum": { |
| "value": 216.56759764254093, |
| "min": -32.000001668930054, |
| "max": 243.83599792420864, |
| "count": 100 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.mean": { |
| "value": 1.7187904574804835, |
| "min": -1.0000000521540642, |
| "max": 1.7798248023664864, |
| "count": 100 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.sum": { |
| "value": 216.56759764254093, |
| "min": -32.000001668930054, |
| "max": 243.83599792420864, |
| "count": 100 |
| }, |
| "Pyramids.Policy.RndReward.mean": { |
| "value": 0.012556998638342882, |
| "min": 0.010937422458509365, |
| "max": 12.201441258192062, |
| "count": 100 |
| }, |
| "Pyramids.Policy.RndReward.sum": { |
| "value": 1.582181828431203, |
| "min": 1.426591651084891, |
| "max": 195.223060131073, |
| "count": 100 |
| }, |
| "Pyramids.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 100 |
| }, |
| "Pyramids.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 100 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1699953005", |
| "python_version": "3.10.3 (main, Mar 28 2022, 09:30:03) [GCC 7.5.0]", |
| "command_line_arguments": "/home/yzeng/anaconda3/envs/deeprl_course_unit5/bin/mlagents-learn ../config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics --force", |
| "mlagents_version": "1.1.0.dev0", |
| "mlagents_envs_version": "1.1.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "2.1.0+cu121", |
| "numpy_version": "1.23.5", |
| "end_time_seconds": "1699956693" |
| }, |
| "total": 3688.2422509463504, |
| "count": 1, |
| "self": 0.3199370610527694, |
| "children": { |
| "run_training.setup": { |
| "total": 0.01085307402536273, |
| "count": 1, |
| "self": 0.01085307402536273 |
| }, |
| "TrainerController.start_learning": { |
| "total": 3687.9114608112723, |
| "count": 1, |
| "self": 3.372778186108917, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 0.8616877705790102, |
| "count": 1, |
| "self": 0.8616877705790102 |
| }, |
| "TrainerController.advance": { |
| "total": 3683.61380162742, |
| "count": 194507, |
| "self": 3.364317771513015, |
| "children": { |
| "env_step": { |
| "total": 2322.2837941045873, |
| "count": 194507, |
| "self": 2124.274842475541, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 195.91820556716993, |
| "count": 194507, |
| "self": 9.23077730787918, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 186.68742825929075, |
| "count": 187562, |
| "self": 186.68742825929075 |
| } |
| } |
| }, |
| "workers": { |
| "total": 2.090746061876416, |
| "count": 194507, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 3683.273943124339, |
| "count": 194507, |
| "is_parallel": true, |
| "self": 1784.8197832303122, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.0012163030914962292, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0003676139749586582, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.000848689116537571, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.000848689116537571 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.023782378993928432, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.00025271298363804817, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.00029502203688025475, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.00029502203688025475 |
| }, |
| "communicator.exchange": { |
| "total": 0.02243240363895893, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.02243240363895893 |
| }, |
| "steps_from_proto": { |
| "total": 0.0008022403344511986, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0001949523575603962, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0006072879768908024, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0006072879768908024 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 1898.4541598940268, |
| "count": 194506, |
| "is_parallel": true, |
| "self": 53.04335350031033, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 39.29772320250049, |
| "count": 194506, |
| "is_parallel": true, |
| "self": 39.29772320250049 |
| }, |
| "communicator.exchange": { |
| "total": 1648.587595764082, |
| "count": 194506, |
| "is_parallel": true, |
| "self": 1648.587595764082 |
| }, |
| "steps_from_proto": { |
| "total": 157.52548742713407, |
| "count": 194506, |
| "is_parallel": true, |
| "self": 36.79078872175887, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 120.7346987053752, |
| "count": 1556048, |
| "is_parallel": true, |
| "self": 120.7346987053752 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 1357.9656897513196, |
| "count": 194507, |
| "self": 6.280239996500313, |
| "children": { |
| "process_trajectory": { |
| "total": 229.36559143615887, |
| "count": 194507, |
| "self": 228.95419924287125, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.411392193287611, |
| "count": 6, |
| "self": 0.411392193287611 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 1122.3198583186604, |
| "count": 1396, |
| "self": 592.612791213207, |
| "children": { |
| "TorchPPOOptimizer.update": { |
| "total": 529.7070671054535, |
| "count": 68406, |
| "self": 529.7070671054535 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 9.122304618358612e-07, |
| "count": 1, |
| "self": 9.122304618358612e-07 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.06319231493398547, |
| "count": 1, |
| "self": 0.0008483538404107094, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.06234396109357476, |
| "count": 1, |
| "self": 0.06234396109357476 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |