| { |
| "name": "root", |
| "gauges": { |
| "Pyramids.Policy.Entropy.mean": { |
| "value": 0.18705493211746216, |
| "min": 0.16478247940540314, |
| "max": 0.44203102588653564, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Entropy.sum": { |
| "value": 5605.662109375, |
| "min": 4938.201171875, |
| "max": 12799.0361328125, |
| "count": 33 |
| }, |
| "Pyramids.Environment.EpisodeLength.mean": { |
| "value": 240.1328125, |
| "min": 229.35245901639345, |
| "max": 336.12359550561797, |
| "count": 33 |
| }, |
| "Pyramids.Environment.EpisodeLength.sum": { |
| "value": 30737.0, |
| "min": 17589.0, |
| "max": 32323.0, |
| "count": 33 |
| }, |
| "Pyramids.Step.mean": { |
| "value": 1979907.0, |
| "min": 1019938.0, |
| "max": 1979907.0, |
| "count": 33 |
| }, |
| "Pyramids.Step.sum": { |
| "value": 1979907.0, |
| "min": 1019938.0, |
| "max": 1979907.0, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
| "value": 0.7753037214279175, |
| "min": 0.5842857956886292, |
| "max": 0.7826550602912903, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
| "value": 234.1417236328125, |
| "min": 112.94467163085938, |
| "max": 234.1417236328125, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndValueEstimate.mean": { |
| "value": 0.007218698039650917, |
| "min": -0.011078650131821632, |
| "max": 0.023848215118050575, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndValueEstimate.sum": { |
| "value": 2.180046796798706, |
| "min": -2.0495502948760986, |
| "max": 6.987526893615723, |
| "count": 33 |
| }, |
| "Pyramids.Environment.CumulativeReward.mean": { |
| "value": 1.7451243954380666, |
| "min": 1.5533956757956935, |
| "max": 1.7542524447695154, |
| "count": 33 |
| }, |
| "Pyramids.Environment.CumulativeReward.sum": { |
| "value": 221.63079822063446, |
| "min": 108.40999849885702, |
| "max": 221.63079822063446, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.mean": { |
| "value": 1.7451243954380666, |
| "min": 1.5533956757956935, |
| "max": 1.7542524447695154, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.sum": { |
| "value": 221.63079822063446, |
| "min": 108.40999849885702, |
| "max": 221.63079822063446, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndReward.mean": { |
| "value": 0.024534388826761254, |
| "min": 0.024235264870737006, |
| "max": 0.04270739211014271, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndReward.sum": { |
| "value": 3.1158673809986794, |
| "min": 2.254476272595639, |
| "max": 3.9742181365727447, |
| "count": 33 |
| }, |
| "Pyramids.Losses.PolicyLoss.mean": { |
| "value": 0.06661360270559921, |
| "min": 0.06401529681924904, |
| "max": 0.07187034715371694, |
| "count": 33 |
| }, |
| "Pyramids.Losses.PolicyLoss.sum": { |
| "value": 0.9325904378783889, |
| "min": 0.5761376713732413, |
| "max": 1.074378561701023, |
| "count": 33 |
| }, |
| "Pyramids.Losses.ValueLoss.mean": { |
| "value": 0.016130074523278467, |
| "min": 0.013827307654967978, |
| "max": 0.017788065528859278, |
| "count": 33 |
| }, |
| "Pyramids.Losses.ValueLoss.sum": { |
| "value": 0.22582104332589853, |
| "min": 0.141306401375914, |
| "max": 0.2668209829328892, |
| "count": 33 |
| }, |
| "Pyramids.Policy.LearningRate.mean": { |
| "value": 5.160880422596431e-06, |
| "min": 5.160880422596431e-06, |
| "max": 0.00014840945053020002, |
| "count": 33 |
| }, |
| "Pyramids.Policy.LearningRate.sum": { |
| "value": 7.225232591635003e-05, |
| "min": 7.225232591635003e-05, |
| "max": 0.0020269283743574503, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Epsilon.mean": { |
| "value": 0.10172026071428573, |
| "min": 0.10172026071428573, |
| "max": 0.14946979999999999, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Epsilon.sum": { |
| "value": 1.4240836500000003, |
| "min": 1.3452282, |
| "max": 2.1564575500000003, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Beta.mean": { |
| "value": 0.00018185404535714294, |
| "min": 0.00018185404535714294, |
| "max": 0.004952033020000001, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Beta.sum": { |
| "value": 0.002545956635000001, |
| "min": 0.002545956635000001, |
| "max": 0.06763669074499999, |
| "count": 33 |
| }, |
| "Pyramids.Losses.RNDLoss.mean": { |
| "value": 0.009958143346011639, |
| "min": 0.008901664055883884, |
| "max": 0.012760956771671772, |
| "count": 33 |
| }, |
| "Pyramids.Losses.RNDLoss.sum": { |
| "value": 0.1394140124320984, |
| "min": 0.11117810755968094, |
| "max": 0.1889527291059494, |
| "count": 33 |
| }, |
| "Pyramids.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 33 |
| }, |
| "Pyramids.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 33 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1711997790", |
| "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]", |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics --resume", |
| "mlagents_version": "1.1.0.dev0", |
| "mlagents_envs_version": "1.1.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "2.2.1+cu121", |
| "numpy_version": "1.23.5", |
| "end_time_seconds": "1712000308" |
| }, |
| "total": 2518.126583485, |
| "count": 1, |
| "self": 0.4756415490001018, |
| "children": { |
| "run_training.setup": { |
| "total": 0.049040627000067616, |
| "count": 1, |
| "self": 0.049040627000067616 |
| }, |
| "TrainerController.start_learning": { |
| "total": 2517.601901309, |
| "count": 1, |
| "self": 1.4609522070804815, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 2.0384117109997533, |
| "count": 1, |
| "self": 2.0384117109997533 |
| }, |
| "TrainerController.advance": { |
| "total": 2514.013688609919, |
| "count": 65417, |
| "self": 1.502925605067503, |
| "children": { |
| "env_step": { |
| "total": 1874.6336485859447, |
| "count": 65417, |
| "self": 1740.1902416718713, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 133.55975684108216, |
| "count": 65417, |
| "self": 4.7747069421711785, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 128.78504989891098, |
| "count": 62560, |
| "self": 128.78504989891098 |
| } |
| } |
| }, |
| "workers": { |
| "total": 0.8836500729912586, |
| "count": 65417, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 2512.251911310238, |
| "count": 65417, |
| "is_parallel": true, |
| "self": 898.011206602202, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.0022879790003571543, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0006465400010711164, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0016414389992860379, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0016414389992860379 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.05712476000007882, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0032920459989327355, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.0004432969999470515, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0004432969999470515 |
| }, |
| "communicator.exchange": { |
| "total": 0.05172769400087418, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.05172769400087418 |
| }, |
| "steps_from_proto": { |
| "total": 0.001661723000324855, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0003732569985004375, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0012884660018244176, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0012884660018244176 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 1614.240704708036, |
| "count": 65416, |
| "is_parallel": true, |
| "self": 34.801910062221395, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 24.99356799708312, |
| "count": 65416, |
| "is_parallel": true, |
| "self": 24.99356799708312 |
| }, |
| "communicator.exchange": { |
| "total": 1451.0625788657353, |
| "count": 65416, |
| "is_parallel": true, |
| "self": 1451.0625788657353 |
| }, |
| "steps_from_proto": { |
| "total": 103.38264778299617, |
| "count": 65416, |
| "is_parallel": true, |
| "self": 21.307672516118146, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 82.07497526687803, |
| "count": 523328, |
| "is_parallel": true, |
| "self": 82.07497526687803 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 637.8771144189068, |
| "count": 65417, |
| "self": 2.9310192950533747, |
| "children": { |
| "process_trajectory": { |
| "total": 135.03107008984261, |
| "count": 65417, |
| "self": 134.81534168884173, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.21572840100088797, |
| "count": 2, |
| "self": 0.21572840100088797 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 499.9150250340108, |
| "count": 472, |
| "self": 294.54177497197907, |
| "children": { |
| "TorchPPOOptimizer.update": { |
| "total": 205.37325006203173, |
| "count": 22713, |
| "self": 205.37325006203173 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 8.400002116104588e-07, |
| "count": 1, |
| "self": 8.400002116104588e-07 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.08884794100049476, |
| "count": 1, |
| "self": 0.0018642500008354546, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.0869836909996593, |
| "count": 1, |
| "self": 0.0869836909996593 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |