| { |
| "name": "root", |
| "gauges": { |
| "Pyramids.Policy.Entropy.mean": { |
| "value": 0.29789021611213684, |
| "min": 0.29789021611213684, |
| "max": 1.367859959602356, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Entropy.sum": { |
| "value": 8927.173828125, |
| "min": 8927.173828125, |
| "max": 41495.3984375, |
| "count": 33 |
| }, |
| "Pyramids.Step.mean": { |
| "value": 989877.0, |
| "min": 29952.0, |
| "max": 989877.0, |
| "count": 33 |
| }, |
| "Pyramids.Step.sum": { |
| "value": 989877.0, |
| "min": 29952.0, |
| "max": 989877.0, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
| "value": 0.4172821640968323, |
| "min": -0.09637138247489929, |
| "max": 0.4753468632698059, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
| "value": 110.57977294921875, |
| "min": -23.22550392150879, |
| "max": 127.39295959472656, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndValueEstimate.mean": { |
| "value": 0.01254123356193304, |
| "min": 0.01254123356193304, |
| "max": 0.5868200063705444, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndValueEstimate.sum": { |
| "value": 3.3234269618988037, |
| "min": 3.3234269618988037, |
| "max": 139.0763397216797, |
| "count": 33 |
| }, |
| "Pyramids.Losses.PolicyLoss.mean": { |
| "value": 0.06969978085373227, |
| "min": 0.06552618757951403, |
| "max": 0.07309274904599349, |
| "count": 33 |
| }, |
| "Pyramids.Losses.PolicyLoss.sum": { |
| "value": 0.9757969319522518, |
| "min": 0.5101009684204372, |
| "max": 1.0511480932473205, |
| "count": 33 |
| }, |
| "Pyramids.Losses.ValueLoss.mean": { |
| "value": 0.013070763274574822, |
| "min": 0.00024218573646627502, |
| "max": 0.01475173796227734, |
| "count": 33 |
| }, |
| "Pyramids.Losses.ValueLoss.sum": { |
| "value": 0.1829906858440475, |
| "min": 0.003148414574061575, |
| "max": 0.20652433147188276, |
| "count": 33 |
| }, |
| "Pyramids.Policy.LearningRate.mean": { |
| "value": 7.627683171757142e-06, |
| "min": 7.627683171757142e-06, |
| "max": 0.00029515063018788575, |
| "count": 33 |
| }, |
| "Pyramids.Policy.LearningRate.sum": { |
| "value": 0.0001067875644046, |
| "min": 0.0001067875644046, |
| "max": 0.0034927333357556, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Epsilon.mean": { |
| "value": 0.10254252857142857, |
| "min": 0.10254252857142857, |
| "max": 0.19838354285714285, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Epsilon.sum": { |
| "value": 1.4355954, |
| "min": 1.3886848, |
| "max": 2.5273532000000003, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Beta.mean": { |
| "value": 0.0002639986042857143, |
| "min": 0.0002639986042857143, |
| "max": 0.00983851593142857, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Beta.sum": { |
| "value": 0.00369598046, |
| "min": 0.00369598046, |
| "max": 0.11643801556, |
| "count": 33 |
| }, |
| "Pyramids.Losses.RNDLoss.mean": { |
| "value": 0.03089161030948162, |
| "min": 0.030175942927598953, |
| "max": 0.6546319723129272, |
| "count": 33 |
| }, |
| "Pyramids.Losses.RNDLoss.sum": { |
| "value": 0.4324825406074524, |
| "min": 0.42246320843696594, |
| "max": 4.582423686981201, |
| "count": 33 |
| }, |
| "Pyramids.Environment.EpisodeLength.mean": { |
| "value": 419.1029411764706, |
| "min": 405.5974025974026, |
| "max": 999.0, |
| "count": 33 |
| }, |
| "Pyramids.Environment.EpisodeLength.sum": { |
| "value": 28499.0, |
| "min": 15984.0, |
| "max": 33026.0, |
| "count": 33 |
| }, |
| "Pyramids.Environment.CumulativeReward.mean": { |
| "value": 1.3798144760987032, |
| "min": -1.0000000521540642, |
| "max": 1.4349420881389003, |
| "count": 33 |
| }, |
| "Pyramids.Environment.CumulativeReward.sum": { |
| "value": 95.20719885081053, |
| "min": -31.99480164051056, |
| "max": 109.05559869855642, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.mean": { |
| "value": 1.3798144760987032, |
| "min": -1.0000000521540642, |
| "max": 1.4349420881389003, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.sum": { |
| "value": 95.20719885081053, |
| "min": -31.99480164051056, |
| "max": 109.05559869855642, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndReward.mean": { |
| "value": 0.13095148351968036, |
| "min": 0.12661478602508155, |
| "max": 13.344655025750399, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndReward.sum": { |
| "value": 9.035652362857945, |
| "min": 9.035652362857945, |
| "max": 213.51448041200638, |
| "count": 33 |
| }, |
| "Pyramids.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 33 |
| }, |
| "Pyramids.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 33 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1697096574", |
| "python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]", |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
| "mlagents_version": "1.1.0.dev0", |
| "mlagents_envs_version": "1.1.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "2.0.1+cu118", |
| "numpy_version": "1.23.5", |
| "end_time_seconds": "1697098956" |
| }, |
| "total": 2381.92797918, |
| "count": 1, |
| "self": 0.5345633160000034, |
| "children": { |
| "run_training.setup": { |
| "total": 0.04264655199995104, |
| "count": 1, |
| "self": 0.04264655199995104 |
| }, |
| "TrainerController.start_learning": { |
| "total": 2381.350769312, |
| "count": 1, |
| "self": 1.8312415618911473, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 3.01589892300035, |
| "count": 1, |
| "self": 3.01589892300035 |
| }, |
| "TrainerController.advance": { |
| "total": 2376.420788169108, |
| "count": 63573, |
| "self": 1.8256890939628647, |
| "children": { |
| "env_step": { |
| "total": 1717.844125627993, |
| "count": 63573, |
| "self": 1568.1376008410944, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 148.62241601598453, |
| "count": 63573, |
| "self": 5.393495830064694, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 143.22892018591983, |
| "count": 62579, |
| "self": 143.22892018591983 |
| } |
| } |
| }, |
| "workers": { |
| "total": 1.0841087709140993, |
| "count": 63573, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 2375.8104885870443, |
| "count": 63573, |
| "is_parallel": true, |
| "self": 949.8809644030521, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.0022297059999800695, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.000690978999955405, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0015387270000246644, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0015387270000246644 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.055314415999873745, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0006212250000316999, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.0005543299998862494, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0005543299998862494 |
| }, |
| "communicator.exchange": { |
| "total": 0.0522933990000638, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0522933990000638 |
| }, |
| "steps_from_proto": { |
| "total": 0.0018454619998919952, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.00041616599992266856, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0014292959999693267, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0014292959999693267 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 1425.9295241839923, |
| "count": 63572, |
| "is_parallel": true, |
| "self": 37.55473791382292, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 26.571704254092765, |
| "count": 63572, |
| "is_parallel": true, |
| "self": 26.571704254092765 |
| }, |
| "communicator.exchange": { |
| "total": 1249.7388750450696, |
| "count": 63572, |
| "is_parallel": true, |
| "self": 1249.7388750450696 |
| }, |
| "steps_from_proto": { |
| "total": 112.06420697100702, |
| "count": 63572, |
| "is_parallel": true, |
| "self": 24.25149092707761, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 87.81271604392941, |
| "count": 508576, |
| "is_parallel": true, |
| "self": 87.81271604392941 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 656.7509734471523, |
| "count": 63573, |
| "self": 3.1832876372186547, |
| "children": { |
| "process_trajectory": { |
| "total": 131.0972472149324, |
| "count": 63573, |
| "self": 130.9019858219317, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.1952613930006919, |
| "count": 2, |
| "self": 0.1952613930006919 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 522.4704385950013, |
| "count": 452, |
| "self": 313.2950051690591, |
| "children": { |
| "TorchPPOOptimizer.update": { |
| "total": 209.17543342594217, |
| "count": 22806, |
| "self": 209.17543342594217 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 1.0140001904801466e-06, |
| "count": 1, |
| "self": 1.0140001904801466e-06 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.08283964400015975, |
| "count": 1, |
| "self": 0.001403623999976844, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.08143602000018291, |
| "count": 1, |
| "self": 0.08143602000018291 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |