| { |
| "name": "root", |
| "gauges": { |
| "Pyramids.Policy.Entropy.mean": { |
| "value": 0.4227753281593323, |
| "min": 0.4227753281593323, |
| "max": 1.4035130739212036, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Entropy.sum": { |
| "value": 12662.966796875, |
| "min": 12662.966796875, |
| "max": 42576.97265625, |
| "count": 33 |
| }, |
| "Pyramids.Step.mean": { |
| "value": 989935.0, |
| "min": 29891.0, |
| "max": 989935.0, |
| "count": 33 |
| }, |
| "Pyramids.Step.sum": { |
| "value": 989935.0, |
| "min": 29891.0, |
| "max": 989935.0, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
| "value": 0.5472075343132019, |
| "min": -0.08480988442897797, |
| "max": 0.5472075343132019, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
| "value": 149.38766479492188, |
| "min": -20.43918228149414, |
| "max": 149.38766479492188, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndValueEstimate.mean": { |
| "value": -0.5827062129974365, |
| "min": -0.5827062129974365, |
| "max": 0.7334055304527283, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndValueEstimate.sum": { |
| "value": -159.07879638671875, |
| "min": -159.07879638671875, |
| "max": 173.81710815429688, |
| "count": 33 |
| }, |
| "Pyramids.Losses.PolicyLoss.mean": { |
| "value": 0.06880309737295778, |
| "min": 0.06303410240728963, |
| "max": 0.07338600206421689, |
| "count": 33 |
| }, |
| "Pyramids.Losses.PolicyLoss.sum": { |
| "value": 0.9632433632214089, |
| "min": 0.5121669554644687, |
| "max": 1.1007900309632532, |
| "count": 33 |
| }, |
| "Pyramids.Losses.ValueLoss.mean": { |
| "value": 0.053455584703312665, |
| "min": 0.0018368665227186263, |
| "max": 0.053455584703312665, |
| "count": 33 |
| }, |
| "Pyramids.Losses.ValueLoss.sum": { |
| "value": 0.7483781858463773, |
| "min": 0.022042398272623515, |
| "max": 0.7483781858463773, |
| "count": 33 |
| }, |
| "Pyramids.Policy.LearningRate.mean": { |
| "value": 7.547840341228574e-06, |
| "min": 7.547840341228574e-06, |
| "max": 0.0002952355301595857, |
| "count": 33 |
| }, |
| "Pyramids.Policy.LearningRate.sum": { |
| "value": 0.00010566976477720003, |
| "min": 0.00010566976477720003, |
| "max": 0.0036344419885193996, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Epsilon.mean": { |
| "value": 0.10251591428571429, |
| "min": 0.10251591428571429, |
| "max": 0.19841184285714286, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Epsilon.sum": { |
| "value": 1.4352228, |
| "min": 1.3888829, |
| "max": 2.6114806000000006, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Beta.mean": { |
| "value": 0.00026133983714285723, |
| "min": 0.00026133983714285723, |
| "max": 0.009841343101428571, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Beta.sum": { |
| "value": 0.0036587577200000014, |
| "min": 0.0036587577200000014, |
| "max": 0.12116691194, |
| "count": 33 |
| }, |
| "Pyramids.Losses.RNDLoss.mean": { |
| "value": 0.013660682365298271, |
| "min": 0.013217068277299404, |
| "max": 0.6735454797744751, |
| "count": 33 |
| }, |
| "Pyramids.Losses.RNDLoss.sum": { |
| "value": 0.1912495493888855, |
| "min": 0.1850389540195465, |
| "max": 4.714818477630615, |
| "count": 33 |
| }, |
| "Pyramids.Environment.EpisodeLength.mean": { |
| "value": 351.07954545454544, |
| "min": 349.4022988505747, |
| "max": 983.1515151515151, |
| "count": 33 |
| }, |
| "Pyramids.Environment.EpisodeLength.sum": { |
| "value": 30895.0, |
| "min": 16690.0, |
| "max": 32444.0, |
| "count": 33 |
| }, |
| "Pyramids.Environment.CumulativeReward.mean": { |
| "value": 1.557974978858097, |
| "min": -0.8650588735061533, |
| "max": 1.6218430201841305, |
| "count": 33 |
| }, |
| "Pyramids.Environment.CumulativeReward.sum": { |
| "value": 137.10179813951254, |
| "min": -28.474001720547676, |
| "max": 137.10179813951254, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.mean": { |
| "value": 1.557974978858097, |
| "min": -0.8650588735061533, |
| "max": 1.6218430201841305, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.sum": { |
| "value": 137.10179813951254, |
| "min": -28.474001720547676, |
| "max": 137.10179813951254, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndReward.mean": { |
| "value": 0.04995945484221342, |
| "min": 0.04917197070064876, |
| "max": 13.278092069660916, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndReward.sum": { |
| "value": 4.3964320261147805, |
| "min": 3.935927780577913, |
| "max": 225.72756518423557, |
| "count": 33 |
| }, |
| "Pyramids.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 33 |
| }, |
| "Pyramids.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 33 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1756135625", |
| "python_version": "3.10.12 (main, Aug 15 2025, 14:32:43) [GCC 11.4.0]", |
| "command_line_arguments": "/home/ubuntu/.local/bin/mlagents-learn ./ml-agents/config/ppo/PyramidsRND.yaml --env=./ml-agents/training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics --force", |
| "mlagents_version": "1.1.0", |
| "mlagents_envs_version": "1.1.0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "2.8.0+cu128", |
| "numpy_version": "1.23.5", |
| "end_time_seconds": "1756136428" |
| }, |
| "total": 802.8712916290001, |
| "count": 1, |
| "self": 0.2177329070000269, |
| "children": { |
| "run_training.setup": { |
| "total": 0.01570750200016846, |
| "count": 1, |
| "self": 0.01570750200016846 |
| }, |
| "TrainerController.start_learning": { |
| "total": 802.6378512199999, |
| "count": 1, |
| "self": 0.6336360961258833, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 1.1959457339999062, |
| "count": 1, |
| "self": 1.1959457339999062 |
| }, |
| "TrainerController.advance": { |
| "total": 800.7609756408747, |
| "count": 63862, |
| "self": 0.5845655628495479, |
| "children": { |
| "env_step": { |
| "total": 501.1566706939698, |
| "count": 63862, |
| "self": 435.2795409839355, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 65.46808117204228, |
| "count": 63862, |
| "self": 2.05530309798678, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 63.412778074055495, |
| "count": 62550, |
| "self": 63.412778074055495 |
| } |
| } |
| }, |
| "workers": { |
| "total": 0.409048537992021, |
| "count": 63862, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 801.4139665399616, |
| "count": 63862, |
| "is_parallel": true, |
| "self": 410.96247375195344, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.0011772079997172114, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0003702619983414479, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0008069460013757634, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0008069460013757634 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.017153541999959998, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.00016109099988170783, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.0001901410000755277, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0001901410000755277 |
| }, |
| "communicator.exchange": { |
| "total": 0.016252166999947804, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.016252166999947804 |
| }, |
| "steps_from_proto": { |
| "total": 0.000550143000054959, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.00012821100062865298, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.000421931999426306, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.000421931999426306 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 390.4514927880082, |
| "count": 63861, |
| "is_parallel": true, |
| "self": 9.907689546058464, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 6.942700701885769, |
| "count": 63861, |
| "is_parallel": true, |
| "self": 6.942700701885769 |
| }, |
| "communicator.exchange": { |
| "total": 344.84160323801643, |
| "count": 63861, |
| "is_parallel": true, |
| "self": 344.84160323801643 |
| }, |
| "steps_from_proto": { |
| "total": 28.759499302047516, |
| "count": 63861, |
| "is_parallel": true, |
| "self": 5.987972682886721, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 22.771526619160795, |
| "count": 510888, |
| "is_parallel": true, |
| "self": 22.771526619160795 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 299.01973938405536, |
| "count": 63862, |
| "self": 1.283134781041099, |
| "children": { |
| "process_trajectory": { |
| "total": 58.892194951010424, |
| "count": 63862, |
| "self": 58.78063713501024, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.111557816000186, |
| "count": 2, |
| "self": 0.111557816000186 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 238.84440965200383, |
| "count": 458, |
| "self": 138.19577779496603, |
| "children": { |
| "TorchPPOOptimizer.update": { |
| "total": 100.6486318570378, |
| "count": 22794, |
| "self": 100.6486318570378 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 6.199998097144999e-07, |
| "count": 1, |
| "self": 6.199998097144999e-07 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.04729312899962679, |
| "count": 1, |
| "self": 0.0013493499996002356, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.04594377900002655, |
| "count": 1, |
| "self": 0.04594377900002655 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |