| { |
| "name": "root", |
| "gauges": { |
| "Pyramids.Policy.Entropy.mean": { |
| "value": 0.6612257361412048, |
| "min": 0.6612257361412048, |
| "max": 1.3829609155654907, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Entropy.sum": { |
| "value": 19678.078125, |
| "min": 19678.078125, |
| "max": 41953.50390625, |
| "count": 33 |
| }, |
| "Pyramids.Step.mean": { |
| "value": 989883.0, |
| "min": 29952.0, |
| "max": 989883.0, |
| "count": 33 |
| }, |
| "Pyramids.Step.sum": { |
| "value": 989883.0, |
| "min": 29952.0, |
| "max": 989883.0, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
| "value": 0.0627322718501091, |
| "min": -0.11199305951595306, |
| "max": 0.09172578901052475, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
| "value": 15.432138442993164, |
| "min": -27.102319717407227, |
| "max": 22.656269073486328, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndValueEstimate.mean": { |
| "value": 0.02176976017653942, |
| "min": 0.007074796594679356, |
| "max": 0.35083121061325073, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndValueEstimate.sum": { |
| "value": 5.355360984802246, |
| "min": 1.7474747896194458, |
| "max": 84.19949340820312, |
| "count": 33 |
| }, |
| "Pyramids.Losses.PolicyLoss.mean": { |
| "value": 0.06850646806835832, |
| "min": 0.06398289415049703, |
| "max": 0.07310759250863705, |
| "count": 33 |
| }, |
| "Pyramids.Losses.PolicyLoss.sum": { |
| "value": 0.9590905529570164, |
| "min": 0.4798651467052846, |
| "max": 1.0437771753045928, |
| "count": 33 |
| }, |
| "Pyramids.Losses.ValueLoss.mean": { |
| "value": 0.005933725971596435, |
| "min": 0.0002992366546125215, |
| "max": 0.005982384877318827, |
| "count": 33 |
| }, |
| "Pyramids.Losses.ValueLoss.sum": { |
| "value": 0.08307216360235009, |
| "min": 0.002992366546125215, |
| "max": 0.08307216360235009, |
| "count": 33 |
| }, |
| "Pyramids.Policy.LearningRate.mean": { |
| "value": 7.464118940564287e-06, |
| "min": 7.464118940564287e-06, |
| "max": 0.00029515063018788575, |
| "count": 33 |
| }, |
| "Pyramids.Policy.LearningRate.sum": { |
| "value": 0.00010449766516790002, |
| "min": 0.00010449766516790002, |
| "max": 0.0030207608930798, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Epsilon.mean": { |
| "value": 0.10248800714285713, |
| "min": 0.10248800714285713, |
| "max": 0.19838354285714285, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Epsilon.sum": { |
| "value": 1.4348321, |
| "min": 1.3691136000000002, |
| "max": 2.359057, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Beta.mean": { |
| "value": 0.0002585519135714287, |
| "min": 0.0002585519135714287, |
| "max": 0.00983851593142857, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Beta.sum": { |
| "value": 0.003619726790000002, |
| "min": 0.003619726790000002, |
| "max": 0.10072132798, |
| "count": 33 |
| }, |
| "Pyramids.Losses.RNDLoss.mean": { |
| "value": 0.014452091418206692, |
| "min": 0.014279200695455074, |
| "max": 0.42627301812171936, |
| "count": 33 |
| }, |
| "Pyramids.Losses.RNDLoss.sum": { |
| "value": 0.20232927799224854, |
| "min": 0.20070239901542664, |
| "max": 2.9839110374450684, |
| "count": 33 |
| }, |
| "Pyramids.Environment.EpisodeLength.mean": { |
| "value": 805.4, |
| "min": 795.5263157894736, |
| "max": 999.0, |
| "count": 33 |
| }, |
| "Pyramids.Environment.EpisodeLength.sum": { |
| "value": 28189.0, |
| "min": 15984.0, |
| "max": 32406.0, |
| "count": 33 |
| }, |
| "Pyramids.Environment.CumulativeReward.mean": { |
| "value": 0.28002281444413324, |
| "min": -1.0000000521540642, |
| "max": 0.28002281444413324, |
| "count": 33 |
| }, |
| "Pyramids.Environment.CumulativeReward.sum": { |
| "value": 9.800798505544662, |
| "min": -32.000001668930054, |
| "max": 9.800798505544662, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.mean": { |
| "value": 0.28002281444413324, |
| "min": -1.0000000521540642, |
| "max": 0.28002281444413324, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.sum": { |
| "value": 9.800798505544662, |
| "min": -32.000001668930054, |
| "max": 9.800798505544662, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndReward.mean": { |
| "value": 0.12133785032866788, |
| "min": 0.11832984130925094, |
| "max": 8.416626082733274, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndReward.sum": { |
| "value": 4.246824761503376, |
| "min": 4.213088566903025, |
| "max": 134.66601732373238, |
| "count": 33 |
| }, |
| "Pyramids.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 33 |
| }, |
| "Pyramids.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 33 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1742555351", |
| "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]", |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
| "mlagents_version": "1.2.0.dev0", |
| "mlagents_envs_version": "1.2.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "2.6.0+cu124", |
| "numpy_version": "1.23.5", |
| "end_time_seconds": "1742557830" |
| }, |
| "total": 2479.1611598629997, |
| "count": 1, |
| "self": 0.5758834610001031, |
| "children": { |
| "run_training.setup": { |
| "total": 0.034341406999828905, |
| "count": 1, |
| "self": 0.034341406999828905 |
| }, |
| "TrainerController.start_learning": { |
| "total": 2478.550934995, |
| "count": 1, |
| "self": 2.433458263002649, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 2.978400418000092, |
| "count": 1, |
| "self": 2.978400418000092 |
| }, |
| "TrainerController.advance": { |
| "total": 2473.0697424669975, |
| "count": 63162, |
| "self": 2.4555728870204803, |
| "children": { |
| "env_step": { |
| "total": 1645.1093814070057, |
| "count": 63162, |
| "self": 1487.5745012469147, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 156.12895080501517, |
| "count": 63162, |
| "self": 6.11167329604973, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 150.01727750896544, |
| "count": 62546, |
| "self": 150.01727750896544 |
| } |
| } |
| }, |
| "workers": { |
| "total": 1.4059293550758412, |
| "count": 63162, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 2471.5795739230416, |
| "count": 63162, |
| "is_parallel": true, |
| "self": 1141.1593669769836, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.004115429999956177, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0016213500002777437, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0024940799996784335, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0024940799996784335 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.07220375299993975, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0005890499996894505, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.000539300000127696, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.000539300000127696 |
| }, |
| "communicator.exchange": { |
| "total": 0.06930812300015532, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.06930812300015532 |
| }, |
| "steps_from_proto": { |
| "total": 0.0017672799999672861, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0003825600001619023, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0013847199998053838, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0013847199998053838 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 1330.420206946058, |
| "count": 63161, |
| "is_parallel": true, |
| "self": 38.685660551049295, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 27.595473760981577, |
| "count": 63161, |
| "is_parallel": true, |
| "self": 27.595473760981577 |
| }, |
| "communicator.exchange": { |
| "total": 1162.6839711710654, |
| "count": 63161, |
| "is_parallel": true, |
| "self": 1162.6839711710654 |
| }, |
| "steps_from_proto": { |
| "total": 101.4551014629617, |
| "count": 63161, |
| "is_parallel": true, |
| "self": 23.00321879287071, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 78.45188267009098, |
| "count": 505288, |
| "is_parallel": true, |
| "self": 78.45188267009098 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 825.5047881729715, |
| "count": 63162, |
| "self": 4.589303499991047, |
| "children": { |
| "process_trajectory": { |
| "total": 138.26821690098018, |
| "count": 63162, |
| "self": 137.73092742998028, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.5372894709998945, |
| "count": 2, |
| "self": 0.5372894709998945 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 682.6472677720003, |
| "count": 433, |
| "self": 264.3730516609744, |
| "children": { |
| "TorchPPOOptimizer.update": { |
| "total": 418.2742161110259, |
| "count": 22863, |
| "self": 418.2742161110259 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 1.4299998838396277e-06, |
| "count": 1, |
| "self": 1.4299998838396277e-06 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.06933241699971404, |
| "count": 1, |
| "self": 0.0014144899996608729, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.06791792700005317, |
| "count": 1, |
| "self": 0.06791792700005317 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |