| { |
| "name": "root", |
| "gauges": { |
| "Pyramids.Policy.Entropy.mean": { |
| "value": 0.5008999705314636, |
| "min": 0.4773056209087372, |
| "max": 1.4854872226715088, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Entropy.sum": { |
| "value": 15123.171875, |
| "min": 14242.7998046875, |
| "max": 45063.7421875, |
| "count": 33 |
| }, |
| "Pyramids.Step.mean": { |
| "value": 989944.0, |
| "min": 29952.0, |
| "max": 989944.0, |
| "count": 33 |
| }, |
| "Pyramids.Step.sum": { |
| "value": 989944.0, |
| "min": 29952.0, |
| "max": 989944.0, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
| "value": 0.24567793309688568, |
| "min": -0.10527270287275314, |
| "max": 0.2654494345188141, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
| "value": 61.91083908081055, |
| "min": -25.26544952392578, |
| "max": 68.75140380859375, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndValueEstimate.mean": { |
| "value": 0.06088830158114433, |
| "min": -0.019152160733938217, |
| "max": 0.2694939970970154, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndValueEstimate.sum": { |
| "value": 15.343852043151855, |
| "min": -4.768887996673584, |
| "max": 63.87007522583008, |
| "count": 33 |
| }, |
| "Pyramids.Losses.PolicyLoss.mean": { |
| "value": 0.07094593892026892, |
| "min": 0.0651082992406091, |
| "max": 0.07574394675795973, |
| "count": 33 |
| }, |
| "Pyramids.Losses.PolicyLoss.sum": { |
| "value": 1.0641890838040338, |
| "min": 0.5302076273057181, |
| "max": 1.0641890838040338, |
| "count": 33 |
| }, |
| "Pyramids.Losses.ValueLoss.mean": { |
| "value": 0.009234968995188669, |
| "min": 0.0005701018202355009, |
| "max": 0.014187979038036782, |
| "count": 33 |
| }, |
| "Pyramids.Losses.ValueLoss.sum": { |
| "value": 0.13852453492783004, |
| "min": 0.007981425483297012, |
| "max": 0.19863170653251494, |
| "count": 33 |
| }, |
| "Pyramids.Policy.LearningRate.mean": { |
| "value": 7.5044174985600025e-06, |
| "min": 7.5044174985600025e-06, |
| "max": 0.00029515063018788575, |
| "count": 33 |
| }, |
| "Pyramids.Policy.LearningRate.sum": { |
| "value": 0.00011256626247840004, |
| "min": 0.00011256626247840004, |
| "max": 0.0036301444899518994, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Epsilon.mean": { |
| "value": 0.10250144000000001, |
| "min": 0.10250144000000001, |
| "max": 0.19838354285714285, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Epsilon.sum": { |
| "value": 1.5375216000000003, |
| "min": 1.3886848, |
| "max": 2.6100480999999998, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Beta.mean": { |
| "value": 0.00025989385600000013, |
| "min": 0.00025989385600000013, |
| "max": 0.00983851593142857, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Beta.sum": { |
| "value": 0.003898407840000002, |
| "min": 0.003898407840000002, |
| "max": 0.12102380519, |
| "count": 33 |
| }, |
| "Pyramids.Losses.RNDLoss.mean": { |
| "value": 0.008191419765353203, |
| "min": 0.007582017220556736, |
| "max": 0.34768661856651306, |
| "count": 33 |
| }, |
| "Pyramids.Losses.RNDLoss.sum": { |
| "value": 0.12287130206823349, |
| "min": 0.10614824295043945, |
| "max": 2.4338064193725586, |
| "count": 33 |
| }, |
| "Pyramids.Environment.EpisodeLength.mean": { |
| "value": 584.0217391304348, |
| "min": 579.433962264151, |
| "max": 999.0, |
| "count": 33 |
| }, |
| "Pyramids.Environment.EpisodeLength.sum": { |
| "value": 26865.0, |
| "min": 15984.0, |
| "max": 33031.0, |
| "count": 33 |
| }, |
| "Pyramids.Environment.CumulativeReward.mean": { |
| "value": 1.0245390949041948, |
| "min": -1.0000000521540642, |
| "max": 1.0245390949041948, |
| "count": 33 |
| }, |
| "Pyramids.Environment.CumulativeReward.sum": { |
| "value": 47.12879836559296, |
| "min": -28.674001529812813, |
| "max": 51.282198294997215, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.mean": { |
| "value": 1.0245390949041948, |
| "min": -1.0000000521540642, |
| "max": 1.0245390949041948, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.sum": { |
| "value": 47.12879836559296, |
| "min": -28.674001529812813, |
| "max": 51.282198294997215, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndReward.mean": { |
| "value": 0.052135885666559814, |
| "min": 0.04904970410167992, |
| "max": 7.379755293019116, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndReward.sum": { |
| "value": 2.3982507406617515, |
| "min": 2.3982507406617515, |
| "max": 118.07608468830585, |
| "count": 33 |
| }, |
| "Pyramids.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 33 |
| }, |
| "Pyramids.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 33 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1697016972", |
| "python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]", |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training V2 --no-graphics", |
| "mlagents_version": "1.1.0.dev0", |
| "mlagents_envs_version": "1.1.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "2.0.1+cu118", |
| "numpy_version": "1.21.2", |
| "end_time_seconds": "1697019303" |
| }, |
| "total": 2331.076256431, |
| "count": 1, |
| "self": 0.48035659000015585, |
| "children": { |
| "run_training.setup": { |
| "total": 0.04397408300019379, |
| "count": 1, |
| "self": 0.04397408300019379 |
| }, |
| "TrainerController.start_learning": { |
| "total": 2330.5519257579995, |
| "count": 1, |
| "self": 1.6238535508900895, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 3.7216097270002138, |
| "count": 1, |
| "self": 3.7216097270002138 |
| }, |
| "TrainerController.advance": { |
| "total": 2325.1291281851095, |
| "count": 63316, |
| "self": 1.566923036195476, |
| "children": { |
| "env_step": { |
| "total": 1622.062057330972, |
| "count": 63316, |
| "self": 1485.839115200004, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 135.26355448800177, |
| "count": 63316, |
| "self": 4.993670367158757, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 130.26988412084302, |
| "count": 62560, |
| "self": 130.26988412084302 |
| } |
| } |
| }, |
| "workers": { |
| "total": 0.9593876429662487, |
| "count": 63316, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 2325.495550961981, |
| "count": 63316, |
| "is_parallel": true, |
| "self": 964.9432444899144, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.0020056560001648904, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0006361600012496638, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0013694959989152267, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0013694959989152267 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.08765681999966546, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0005577549991357955, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.0004937700000482437, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0004937700000482437 |
| }, |
| "communicator.exchange": { |
| "total": 0.08471973800033084, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.08471973800033084 |
| }, |
| "steps_from_proto": { |
| "total": 0.001885557000150584, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.00039294400085054804, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0014926129993000359, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0014926129993000359 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 1360.5523064720664, |
| "count": 63315, |
| "is_parallel": true, |
| "self": 35.12377299516129, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 24.168969467937586, |
| "count": 63315, |
| "is_parallel": true, |
| "self": 24.168969467937586 |
| }, |
| "communicator.exchange": { |
| "total": 1191.4457042949516, |
| "count": 63315, |
| "is_parallel": true, |
| "self": 1191.4457042949516 |
| }, |
| "steps_from_proto": { |
| "total": 109.81385971401596, |
| "count": 63315, |
| "is_parallel": true, |
| "self": 22.217671704017903, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 87.59618800999806, |
| "count": 506520, |
| "is_parallel": true, |
| "self": 87.59618800999806 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 701.500147817942, |
| "count": 63316, |
| "self": 3.005095362015709, |
| "children": { |
| "process_trajectory": { |
| "total": 123.75213156392829, |
| "count": 63316, |
| "self": 123.57756627792878, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.17456528599950616, |
| "count": 2, |
| "self": 0.17456528599950616 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 574.742920891998, |
| "count": 453, |
| "self": 370.57453853799143, |
| "children": { |
| "TorchPPOOptimizer.update": { |
| "total": 204.16838235400655, |
| "count": 22755, |
| "self": 204.16838235400655 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 1.3179997040424496e-06, |
| "count": 1, |
| "self": 1.3179997040424496e-06 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.0773329769999691, |
| "count": 1, |
| "self": 0.001754999000695534, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.07557797799927357, |
| "count": 1, |
| "self": 0.07557797799927357 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |