| { |
| "name": "root", |
| "gauges": { |
| "Pyramids.Policy.Entropy.mean": { |
| "value": 0.44500088691711426, |
| "min": 0.44500088691711426, |
| "max": 1.4098087549209595, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Entropy.sum": { |
| "value": 13335.7861328125, |
| "min": 13335.7861328125, |
| "max": 42767.95703125, |
| "count": 33 |
| }, |
| "Pyramids.Step.mean": { |
| "value": 989955.0, |
| "min": 29952.0, |
| "max": 989955.0, |
| "count": 33 |
| }, |
| "Pyramids.Step.sum": { |
| "value": 989955.0, |
| "min": 29952.0, |
| "max": 989955.0, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
| "value": 0.4594956338405609, |
| "min": -0.10418813675642014, |
| "max": 0.5874286890029907, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
| "value": 124.5233154296875, |
| "min": -25.213529586791992, |
| "max": 166.24232482910156, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndValueEstimate.mean": { |
| "value": 0.06584659963846207, |
| "min": -0.5372107028961182, |
| "max": 0.4068872630596161, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndValueEstimate.sum": { |
| "value": 17.84442901611328, |
| "min": -146.12130737304688, |
| "max": 96.43228149414062, |
| "count": 33 |
| }, |
| "Pyramids.Losses.PolicyLoss.mean": { |
| "value": 0.06953306640692367, |
| "min": 0.0658238390238867, |
| "max": 0.07514423476892436, |
| "count": 33 |
| }, |
| "Pyramids.Losses.PolicyLoss.sum": { |
| "value": 0.9734629296969313, |
| "min": 0.47950057450972294, |
| "max": 1.052019286764941, |
| "count": 33 |
| }, |
| "Pyramids.Losses.ValueLoss.mean": { |
| "value": 0.05162858053725878, |
| "min": 0.0002478269929841048, |
| "max": 0.05162858053725878, |
| "count": 33 |
| }, |
| "Pyramids.Losses.ValueLoss.sum": { |
| "value": 0.7228001275216229, |
| "min": 0.003221750908793363, |
| "max": 0.7228001275216229, |
| "count": 33 |
| }, |
| "Pyramids.Policy.LearningRate.mean": { |
| "value": 7.477447507550003e-06, |
| "min": 7.477447507550003e-06, |
| "max": 0.00029515063018788575, |
| "count": 33 |
| }, |
| "Pyramids.Policy.LearningRate.sum": { |
| "value": 0.00010468426510570005, |
| "min": 0.00010468426510570005, |
| "max": 0.003254798615067199, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Epsilon.mean": { |
| "value": 0.10249245, |
| "min": 0.10249245, |
| "max": 0.19838354285714285, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Epsilon.sum": { |
| "value": 1.4348943, |
| "min": 1.3691136000000002, |
| "max": 2.3849328, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Beta.mean": { |
| "value": 0.0002589957550000001, |
| "min": 0.0002589957550000001, |
| "max": 0.00983851593142857, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Beta.sum": { |
| "value": 0.0036259405700000014, |
| "min": 0.0036259405700000014, |
| "max": 0.10851478672, |
| "count": 33 |
| }, |
| "Pyramids.Losses.RNDLoss.mean": { |
| "value": 0.008720179088413715, |
| "min": 0.008618001826107502, |
| "max": 0.5024706721305847, |
| "count": 33 |
| }, |
| "Pyramids.Losses.RNDLoss.sum": { |
| "value": 0.12208250164985657, |
| "min": 0.12065202742815018, |
| "max": 3.5172948837280273, |
| "count": 33 |
| }, |
| "Pyramids.Environment.EpisodeLength.mean": { |
| "value": 378.67088607594934, |
| "min": 324.8494623655914, |
| "max": 999.0, |
| "count": 33 |
| }, |
| "Pyramids.Environment.EpisodeLength.sum": { |
| "value": 29915.0, |
| "min": 15984.0, |
| "max": 32512.0, |
| "count": 33 |
| }, |
| "Pyramids.Environment.CumulativeReward.mean": { |
| "value": 1.5170333177233353, |
| "min": -1.0000000521540642, |
| "max": 1.6536429884933657, |
| "count": 33 |
| }, |
| "Pyramids.Environment.CumulativeReward.sum": { |
| "value": 118.32859878242016, |
| "min": -32.000001668930054, |
| "max": 153.788797929883, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.mean": { |
| "value": 1.5170333177233353, |
| "min": -1.0000000521540642, |
| "max": 1.6536429884933657, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.sum": { |
| "value": 118.32859878242016, |
| "min": -32.000001668930054, |
| "max": 153.788797929883, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndReward.mean": { |
| "value": 0.034244005688845225, |
| "min": 0.029824881925828436, |
| "max": 10.70782103575766, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndReward.sum": { |
| "value": 2.6710324437299278, |
| "min": 2.6710324437299278, |
| "max": 171.32513657212257, |
| "count": 33 |
| }, |
| "Pyramids.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 33 |
| }, |
| "Pyramids.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 33 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1677785858", |
| "python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]", |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
| "mlagents_version": "0.29.0.dev0", |
| "mlagents_envs_version": "0.29.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "1.8.1+cu102", |
| "numpy_version": "1.22.4", |
| "end_time_seconds": "1677788174" |
| }, |
| "total": 2316.566591193, |
| "count": 1, |
| "self": 0.49688419800031625, |
| "children": { |
| "run_training.setup": { |
| "total": 0.11144246999992902, |
| "count": 1, |
| "self": 0.11144246999992902 |
| }, |
| "TrainerController.start_learning": { |
| "total": 2315.958264525, |
| "count": 1, |
| "self": 1.283985963032137, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 7.2134846740000285, |
| "count": 1, |
| "self": 7.2134846740000285 |
| }, |
| "TrainerController.advance": { |
| "total": 2307.3721222039676, |
| "count": 63775, |
| "self": 1.3955447060034203, |
| "children": { |
| "env_step": { |
| "total": 1550.598698021013, |
| "count": 63775, |
| "self": 1438.5709304770357, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 111.21656685699645, |
| "count": 63775, |
| "self": 4.661132751949708, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 106.55543410504674, |
| "count": 62559, |
| "self": 36.212146297036725, |
| "children": { |
| "TorchPolicy.sample_actions": { |
| "total": 70.34328780801002, |
| "count": 62559, |
| "self": 70.34328780801002 |
| } |
| } |
| } |
| } |
| }, |
| "workers": { |
| "total": 0.8112006869807828, |
| "count": 63775, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 2311.2174265830226, |
| "count": 63775, |
| "is_parallel": true, |
| "self": 986.0854838100192, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.0021046189999651688, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0007118419996459124, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0013927770003192563, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0013927770003192563 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.04606312600003548, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0005507810001290636, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.00042988499990315177, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.00042988499990315177 |
| }, |
| "communicator.exchange": { |
| "total": 0.04338404800000717, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.04338404800000717 |
| }, |
| "steps_from_proto": { |
| "total": 0.0016984119999960967, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0003874379999615485, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0013109740000345482, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0013109740000345482 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 1325.1319427730034, |
| "count": 63774, |
| "is_parallel": true, |
| "self": 31.7022571140094, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 23.277163388958115, |
| "count": 63774, |
| "is_parallel": true, |
| "self": 23.277163388958115 |
| }, |
| "communicator.exchange": { |
| "total": 1177.832288414997, |
| "count": 63774, |
| "is_parallel": true, |
| "self": 1177.832288414997 |
| }, |
| "steps_from_proto": { |
| "total": 92.32023385503885, |
| "count": 63774, |
| "is_parallel": true, |
| "self": 21.764683111133763, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 70.55555074390509, |
| "count": 510192, |
| "is_parallel": true, |
| "self": 70.55555074390509 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 755.3778794769514, |
| "count": 63775, |
| "self": 2.383214044932629, |
| "children": { |
| "process_trajectory": { |
| "total": 164.73012766101965, |
| "count": 63775, |
| "self": 164.54556063801965, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.1845670229999996, |
| "count": 2, |
| "self": 0.1845670229999996 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 588.2645377709991, |
| "count": 438, |
| "self": 228.8944533430058, |
| "children": { |
| "TorchPPOOptimizer.update": { |
| "total": 359.37008442799333, |
| "count": 22830, |
| "self": 359.37008442799333 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 1.03899992609513e-06, |
| "count": 1, |
| "self": 1.03899992609513e-06 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.08867064500009292, |
| "count": 1, |
| "self": 0.0018972440002471558, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.08677340099984576, |
| "count": 1, |
| "self": 0.08677340099984576 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |