| { |
| "name": "root", |
| "gauges": { |
| "Pyramids.Policy.Entropy.mean": { |
| "value": 0.38749825954437256, |
| "min": 0.38617178797721863, |
| "max": 1.4779518842697144, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Entropy.sum": { |
| "value": 11550.5478515625, |
| "min": 11550.5478515625, |
| "max": 44835.1484375, |
| "count": 33 |
| }, |
| "Pyramids.Step.mean": { |
| "value": 989899.0, |
| "min": 29908.0, |
| "max": 989899.0, |
| "count": 33 |
| }, |
| "Pyramids.Step.sum": { |
| "value": 989899.0, |
| "min": 29908.0, |
| "max": 989899.0, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
| "value": 0.37798383831977844, |
| "min": -0.09477484226226807, |
| "max": 0.4683753252029419, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
| "value": 101.29966735839844, |
| "min": -22.840736389160156, |
| "max": 126.46133422851562, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndValueEstimate.mean": { |
| "value": -0.0241877231746912, |
| "min": -0.031342942267656326, |
| "max": 0.2993612289428711, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndValueEstimate.sum": { |
| "value": -6.482309818267822, |
| "min": -8.462594032287598, |
| "max": 70.9486083984375, |
| "count": 33 |
| }, |
| "Pyramids.Losses.PolicyLoss.mean": { |
| "value": 0.07015097327772915, |
| "min": 0.06414965563355765, |
| "max": 0.07358444599493918, |
| "count": 33 |
| }, |
| "Pyramids.Losses.PolicyLoss.sum": { |
| "value": 0.9821136258882082, |
| "min": 0.4490475894349036, |
| "max": 1.1001935511548984, |
| "count": 33 |
| }, |
| "Pyramids.Losses.ValueLoss.mean": { |
| "value": 0.013804367392454187, |
| "min": 0.0005465998558006482, |
| "max": 0.01438293275423348, |
| "count": 33 |
| }, |
| "Pyramids.Losses.ValueLoss.sum": { |
| "value": 0.1932611434943586, |
| "min": 0.004919398702205834, |
| "max": 0.21574399131350222, |
| "count": 33 |
| }, |
| "Pyramids.Policy.LearningRate.mean": { |
| "value": 7.482118934564283e-06, |
| "min": 7.482118934564283e-06, |
| "max": 0.0002952348015884, |
| "count": 33 |
| }, |
| "Pyramids.Policy.LearningRate.sum": { |
| "value": 0.00010474966508389996, |
| "min": 0.00010474966508389996, |
| "max": 0.0035078921307027, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Epsilon.mean": { |
| "value": 0.10249400714285715, |
| "min": 0.10249400714285715, |
| "max": 0.1984116, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Epsilon.sum": { |
| "value": 1.4349161000000001, |
| "min": 1.3888812, |
| "max": 2.5692973, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Beta.mean": { |
| "value": 0.0002591513135714285, |
| "min": 0.0002591513135714285, |
| "max": 0.00984131884, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Beta.sum": { |
| "value": 0.0036281183899999985, |
| "min": 0.0036281183899999985, |
| "max": 0.11695280027, |
| "count": 33 |
| }, |
| "Pyramids.Losses.RNDLoss.mean": { |
| "value": 0.011420076712965965, |
| "min": 0.011420076712965965, |
| "max": 0.5271530747413635, |
| "count": 33 |
| }, |
| "Pyramids.Losses.RNDLoss.sum": { |
| "value": 0.15988107025623322, |
| "min": 0.15988107025623322, |
| "max": 3.6900713443756104, |
| "count": 33 |
| }, |
| "Pyramids.Environment.EpisodeLength.mean": { |
| "value": 467.7971014492754, |
| "min": 401.64383561643837, |
| "max": 999.0, |
| "count": 33 |
| }, |
| "Pyramids.Environment.EpisodeLength.sum": { |
| "value": 32278.0, |
| "min": 16707.0, |
| "max": 32278.0, |
| "count": 33 |
| }, |
| "Pyramids.Environment.CumulativeReward.mean": { |
| "value": 1.2712347583062407, |
| "min": -1.0000000521540642, |
| "max": 1.486647345517811, |
| "count": 33 |
| }, |
| "Pyramids.Environment.CumulativeReward.sum": { |
| "value": 87.71519832313061, |
| "min": -32.000001668930054, |
| "max": 112.98519825935364, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.mean": { |
| "value": 1.2712347583062407, |
| "min": -1.0000000521540642, |
| "max": 1.486647345517811, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.sum": { |
| "value": 87.71519832313061, |
| "min": -32.000001668930054, |
| "max": 112.98519825935364, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndReward.mean": { |
| "value": 0.05505368986801393, |
| "min": 0.048350382187522516, |
| "max": 10.450664348462048, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndReward.sum": { |
| "value": 3.798704600892961, |
| "min": 3.577928281876666, |
| "max": 177.66129392385483, |
| "count": 33 |
| }, |
| "Pyramids.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 33 |
| }, |
| "Pyramids.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 33 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1747904210", |
| "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]", |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
| "mlagents_version": "1.2.0.dev0", |
| "mlagents_envs_version": "1.2.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "2.7.0+cu126", |
| "numpy_version": "1.23.5", |
| "end_time_seconds": "1747907275" |
| }, |
| "total": 3064.326325808, |
| "count": 1, |
| "self": 0.5930943060006939, |
| "children": { |
| "run_training.setup": { |
| "total": 0.036050697999598924, |
| "count": 1, |
| "self": 0.036050697999598924 |
| }, |
| "TrainerController.start_learning": { |
| "total": 3063.697180804, |
| "count": 1, |
| "self": 2.413947020057094, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 4.522547317999852, |
| "count": 1, |
| "self": 4.522547317999852 |
| }, |
| "TrainerController.advance": { |
| "total": 3056.676068109943, |
| "count": 63762, |
| "self": 2.54273445504532, |
| "children": { |
| "env_step": { |
| "total": 2019.632045587955, |
| "count": 63762, |
| "self": 1861.8729795300887, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 156.35573263386868, |
| "count": 63762, |
| "self": 6.8219189418614405, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 149.53381369200724, |
| "count": 62569, |
| "self": 149.53381369200724 |
| } |
| } |
| }, |
| "workers": { |
| "total": 1.4033334239975375, |
| "count": 63762, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 3056.4151284029163, |
| "count": 63762, |
| "is_parallel": true, |
| "self": 1366.5519604488477, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.003977787999701832, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0015183109994723054, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0024594770002295263, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0024594770002295263 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.22586353599990616, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.004402599999593804, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.0007351910003308149, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0007351910003308149 |
| }, |
| "communicator.exchange": { |
| "total": 0.19935630000009041, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.19935630000009041 |
| }, |
| "steps_from_proto": { |
| "total": 0.02136944499989113, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.005143133999808924, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.016226311000082205, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.016226311000082205 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 1689.8631679540686, |
| "count": 63761, |
| "is_parallel": true, |
| "self": 45.12232580395721, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 30.770029259028433, |
| "count": 63761, |
| "is_parallel": true, |
| "self": 30.770029259028433 |
| }, |
| "communicator.exchange": { |
| "total": 1487.2160940550184, |
| "count": 63761, |
| "is_parallel": true, |
| "self": 1487.2160940550184 |
| }, |
| "steps_from_proto": { |
| "total": 126.75471883606451, |
| "count": 63761, |
| "is_parallel": true, |
| "self": 27.568633068331565, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 99.18608576773295, |
| "count": 510088, |
| "is_parallel": true, |
| "self": 99.18608576773295 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 1034.5012880669428, |
| "count": 63762, |
| "self": 4.350158363921764, |
| "children": { |
| "process_trajectory": { |
| "total": 161.9294855840185, |
| "count": 63762, |
| "self": 161.6172658900191, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.31221969399939553, |
| "count": 2, |
| "self": 0.31221969399939553 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 868.2216441190026, |
| "count": 450, |
| "self": 357.2702732719622, |
| "children": { |
| "TorchPPOOptimizer.update": { |
| "total": 510.9513708470404, |
| "count": 22812, |
| "self": 510.9513708470404 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 1.0410003596916795e-06, |
| "count": 1, |
| "self": 1.0410003596916795e-06 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.08461731499937741, |
| "count": 1, |
| "self": 0.001822034999349853, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.08279528000002756, |
| "count": 1, |
| "self": 0.08279528000002756 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |