| { |
| "name": "root", |
| "gauges": { |
| "Pyramids.Policy.Entropy.mean": { |
| "value": 0.4246387779712677, |
| "min": 0.4246387779712677, |
| "max": 1.4456040859222412, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Entropy.sum": { |
| "value": 12773.134765625, |
| "min": 12773.134765625, |
| "max": 43853.84375, |
| "count": 33 |
| }, |
| "Pyramids.Step.mean": { |
| "value": 989926.0, |
| "min": 29952.0, |
| "max": 989926.0, |
| "count": 33 |
| }, |
| "Pyramids.Step.sum": { |
| "value": 989926.0, |
| "min": 29952.0, |
| "max": 989926.0, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
| "value": 0.5708710551261902, |
| "min": -0.061649616807699203, |
| "max": 0.6232691407203674, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
| "value": 157.56040954589844, |
| "min": -14.980856895446777, |
| "max": 177.00843811035156, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndValueEstimate.mean": { |
| "value": -0.04511358216404915, |
| "min": -0.04511358216404915, |
| "max": 0.7476927042007446, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndValueEstimate.sum": { |
| "value": -12.451348304748535, |
| "min": -12.451348304748535, |
| "max": 177.2031707763672, |
| "count": 33 |
| }, |
| "Pyramids.Losses.PolicyLoss.mean": { |
| "value": 0.06698757979708413, |
| "min": 0.06565299234630186, |
| "max": 0.07363895688415457, |
| "count": 33 |
| }, |
| "Pyramids.Losses.PolicyLoss.sum": { |
| "value": 1.004813696956262, |
| "min": 0.5150413518054303, |
| "max": 1.0925647304781403, |
| "count": 33 |
| }, |
| "Pyramids.Losses.ValueLoss.mean": { |
| "value": 0.017095749339794897, |
| "min": 0.0012846800181240889, |
| "max": 0.02962426979588816, |
| "count": 33 |
| }, |
| "Pyramids.Losses.ValueLoss.sum": { |
| "value": 0.25643624009692345, |
| "min": 0.012846800181240889, |
| "max": 0.25643624009692345, |
| "count": 33 |
| }, |
| "Pyramids.Policy.LearningRate.mean": { |
| "value": 7.552817482426668e-06, |
| "min": 7.552817482426668e-06, |
| "max": 0.00029515063018788575, |
| "count": 33 |
| }, |
| "Pyramids.Policy.LearningRate.sum": { |
| "value": 0.00011329226223640002, |
| "min": 0.00011329226223640002, |
| "max": 0.0036347473884176, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Epsilon.mean": { |
| "value": 0.10251757333333332, |
| "min": 0.10251757333333332, |
| "max": 0.19838354285714285, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Epsilon.sum": { |
| "value": 1.5377636, |
| "min": 1.3886848, |
| "max": 2.6623066, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Beta.mean": { |
| "value": 0.000261505576, |
| "min": 0.000261505576, |
| "max": 0.00983851593142857, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Beta.sum": { |
| "value": 0.00392258364, |
| "min": 0.00392258364, |
| "max": 0.12117708176000001, |
| "count": 33 |
| }, |
| "Pyramids.Losses.RNDLoss.mean": { |
| "value": 0.014357751235365868, |
| "min": 0.014245187863707542, |
| "max": 0.8657411932945251, |
| "count": 33 |
| }, |
| "Pyramids.Losses.RNDLoss.sum": { |
| "value": 0.21536627411842346, |
| "min": 0.1994326263666153, |
| "max": 6.060188293457031, |
| "count": 33 |
| }, |
| "Pyramids.Environment.EpisodeLength.mean": { |
| "value": 320.40425531914894, |
| "min": 298.7755102040816, |
| "max": 999.0, |
| "count": 33 |
| }, |
| "Pyramids.Environment.EpisodeLength.sum": { |
| "value": 30118.0, |
| "min": 15984.0, |
| "max": 32950.0, |
| "count": 33 |
| }, |
| "Pyramids.Environment.CumulativeReward.mean": { |
| "value": 1.6571139593919118, |
| "min": -1.0000000521540642, |
| "max": 1.6826123519963825, |
| "count": 33 |
| }, |
| "Pyramids.Environment.CumulativeReward.sum": { |
| "value": 154.1115982234478, |
| "min": -30.753001734614372, |
| "max": 163.2133981436491, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.mean": { |
| "value": 1.6571139593919118, |
| "min": -1.0000000521540642, |
| "max": 1.6826123519963825, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.sum": { |
| "value": 154.1115982234478, |
| "min": -30.753001734614372, |
| "max": 163.2133981436491, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndReward.mean": { |
| "value": 0.04798846740353232, |
| "min": 0.044617075882173986, |
| "max": 19.5529414601624, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndReward.sum": { |
| "value": 4.462927468528505, |
| "min": 4.205655123165343, |
| "max": 312.8470633625984, |
| "count": 33 |
| }, |
| "Pyramids.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 33 |
| }, |
| "Pyramids.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 33 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1768143178", |
| "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]", |
| "command_line_arguments": "/home/ruedi/miniconda3/envs/deep-rl-unit5/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
| "mlagents_version": "1.2.0.dev0", |
| "mlagents_envs_version": "1.2.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "2.7.1+cu118", |
| "numpy_version": "1.23.5", |
| "end_time_seconds": "1768144877" |
| }, |
| "total": 1699.4481448590013, |
| "count": 1, |
| "self": 0.32161057400298887, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0265691769982368, |
| "count": 1, |
| "self": 0.0265691769982368 |
| }, |
| "TrainerController.start_learning": { |
| "total": 1699.099965108, |
| "count": 1, |
| "self": 1.0126069420657586, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 2.489544700998522, |
| "count": 1, |
| "self": 2.489544700998522 |
| }, |
| "TrainerController.advance": { |
| "total": 1695.5144028799386, |
| "count": 64098, |
| "self": 1.0758791520038358, |
| "children": { |
| "env_step": { |
| "total": 1034.170596157328, |
| "count": 64098, |
| "self": 900.9851592079485, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 132.5512001971092, |
| "count": 64098, |
| "self": 3.4022758224764402, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 129.14892437463277, |
| "count": 62552, |
| "self": 129.14892437463277 |
| } |
| } |
| }, |
| "workers": { |
| "total": 0.6342367522702261, |
| "count": 64098, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 1696.8730614146843, |
| "count": 64098, |
| "is_parallel": true, |
| "self": 883.3339461736832, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.002434030999211245, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0005315310008882079, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0019024999983230373, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0019024999983230373 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.04527939900071942, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0008197250008379342, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.00027776099886978045, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.00027776099886978045 |
| }, |
| "communicator.exchange": { |
| "total": 0.042582305999530945, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.042582305999530945 |
| }, |
| "steps_from_proto": { |
| "total": 0.0015996070014807628, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.00027805700119643006, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0013215500002843328, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0013215500002843328 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 813.5391152410011, |
| "count": 64097, |
| "is_parallel": true, |
| "self": 29.240099724700485, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 20.409567403163237, |
| "count": 64097, |
| "is_parallel": true, |
| "self": 20.409567403163237 |
| }, |
| "communicator.exchange": { |
| "total": 674.0780032838593, |
| "count": 64097, |
| "is_parallel": true, |
| "self": 674.0780032838593 |
| }, |
| "steps_from_proto": { |
| "total": 89.81144482927812, |
| "count": 64097, |
| "is_parallel": true, |
| "self": 19.6907945834173, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 70.12065024586082, |
| "count": 512776, |
| "is_parallel": true, |
| "self": 70.12065024586082 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 660.2679275706068, |
| "count": 64098, |
| "self": 1.7409405515463732, |
| "children": { |
| "process_trajectory": { |
| "total": 109.60059068708506, |
| "count": 64098, |
| "self": 109.42354976508796, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.1770409219971043, |
| "count": 2, |
| "self": 0.1770409219971043 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 548.9263963319754, |
| "count": 453, |
| "self": 265.25873213222076, |
| "children": { |
| "TorchPPOOptimizer.update": { |
| "total": 283.66766419975465, |
| "count": 22752, |
| "self": 283.66766419975465 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 8.049973985180259e-07, |
| "count": 1, |
| "self": 8.049973985180259e-07 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.0834097799997835, |
| "count": 1, |
| "self": 0.0009502159991825465, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.08245956400060095, |
| "count": 1, |
| "self": 0.08245956400060095 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |