| { |
| "name": "root", |
| "gauges": { |
| "Pyramids.Policy.Entropy.mean": { |
| "value": 0.13125251233577728, |
| "min": 0.1266728788614273, |
| "max": 1.4334834814071655, |
| "count": 100 |
| }, |
| "Pyramids.Policy.Entropy.sum": { |
| "value": 3937.575439453125, |
| "min": 3788.02587890625, |
| "max": 43486.15625, |
| "count": 100 |
| }, |
| "Pyramids.Step.mean": { |
| "value": 2999971.0, |
| "min": 29952.0, |
| "max": 2999971.0, |
| "count": 100 |
| }, |
| "Pyramids.Step.sum": { |
| "value": 2999971.0, |
| "min": 29952.0, |
| "max": 2999971.0, |
| "count": 100 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
| "value": 0.7409255504608154, |
| "min": -0.10395684093236923, |
| "max": 0.8428269028663635, |
| "count": 100 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
| "value": 214.868408203125, |
| "min": -24.949642181396484, |
| "max": 255.37655639648438, |
| "count": 100 |
| }, |
| "Pyramids.Policy.RndValueEstimate.mean": { |
| "value": 0.014302385039627552, |
| "min": -0.08000713586807251, |
| "max": 0.3142332434654236, |
| "count": 100 |
| }, |
| "Pyramids.Policy.RndValueEstimate.sum": { |
| "value": 4.14769172668457, |
| "min": -20.641841888427734, |
| "max": 75.73020935058594, |
| "count": 100 |
| }, |
| "Pyramids.Losses.PolicyLoss.mean": { |
| "value": 0.06710547671814095, |
| "min": 0.0634419109643906, |
| "max": 0.07480556164908611, |
| "count": 100 |
| }, |
| "Pyramids.Losses.PolicyLoss.sum": { |
| "value": 0.9394766740539732, |
| "min": 0.4866420462852659, |
| "max": 1.0744367132702952, |
| "count": 100 |
| }, |
| "Pyramids.Losses.ValueLoss.mean": { |
| "value": 0.01554489962013793, |
| "min": 0.0006077335625649556, |
| "max": 0.01744368394845099, |
| "count": 100 |
| }, |
| "Pyramids.Losses.ValueLoss.sum": { |
| "value": 0.21762859468193102, |
| "min": 0.008330488975790263, |
| "max": 0.2610343461856246, |
| "count": 100 |
| }, |
| "Pyramids.Policy.LearningRate.mean": { |
| "value": 1.4382138063428581e-06, |
| "min": 1.4382138063428581e-06, |
| "max": 0.00029838354339596195, |
| "count": 100 |
| }, |
| "Pyramids.Policy.LearningRate.sum": { |
| "value": 2.0134993288800014e-05, |
| "min": 2.0134993288800014e-05, |
| "max": 0.003969560076813332, |
| "count": 100 |
| }, |
| "Pyramids.Policy.Epsilon.mean": { |
| "value": 0.10047937142857145, |
| "min": 0.10047937142857145, |
| "max": 0.19946118095238097, |
| "count": 100 |
| }, |
| "Pyramids.Policy.Epsilon.sum": { |
| "value": 1.4067112000000004, |
| "min": 1.3962282666666668, |
| "max": 2.737505266666667, |
| "count": 100 |
| }, |
| "Pyramids.Policy.Beta.mean": { |
| "value": 5.788920571428576e-05, |
| "min": 5.788920571428576e-05, |
| "max": 0.009946171977142856, |
| "count": 100 |
| }, |
| "Pyramids.Policy.Beta.sum": { |
| "value": 0.0008104488800000007, |
| "min": 0.0008104488800000007, |
| "max": 0.13232634799999998, |
| "count": 100 |
| }, |
| "Pyramids.Losses.RNDLoss.mean": { |
| "value": 0.006704431492835283, |
| "min": 0.006704431492835283, |
| "max": 0.48235660791397095, |
| "count": 100 |
| }, |
| "Pyramids.Losses.RNDLoss.sum": { |
| "value": 0.09386204183101654, |
| "min": 0.09386204183101654, |
| "max": 3.3764963150024414, |
| "count": 100 |
| }, |
| "Pyramids.Environment.EpisodeLength.mean": { |
| "value": 250.67241379310346, |
| "min": 210.52482269503545, |
| "max": 999.0, |
| "count": 100 |
| }, |
| "Pyramids.Environment.EpisodeLength.sum": { |
| "value": 29078.0, |
| "min": 15984.0, |
| "max": 32958.0, |
| "count": 100 |
| }, |
| "Pyramids.Environment.CumulativeReward.mean": { |
| "value": 1.697591361043782, |
| "min": -1.0000000521540642, |
| "max": 1.7752850921230112, |
| "count": 100 |
| }, |
| "Pyramids.Environment.CumulativeReward.sum": { |
| "value": 196.92059788107872, |
| "min": -30.433601640164852, |
| "max": 250.3151979893446, |
| "count": 100 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.mean": { |
| "value": 1.697591361043782, |
| "min": -1.0000000521540642, |
| "max": 1.7752850921230112, |
| "count": 100 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.sum": { |
| "value": 196.92059788107872, |
| "min": -30.433601640164852, |
| "max": 250.3151979893446, |
| "count": 100 |
| }, |
| "Pyramids.Policy.RndReward.mean": { |
| "value": 0.017440856715626885, |
| "min": 0.01581837089132874, |
| "max": 9.29213576670736, |
| "count": 100 |
| }, |
| "Pyramids.Policy.RndReward.sum": { |
| "value": 2.0231393790127186, |
| "min": 1.9819676644983701, |
| "max": 148.67417226731777, |
| "count": 100 |
| }, |
| "Pyramids.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 100 |
| }, |
| "Pyramids.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 100 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1706728531", |
| "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]", |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
| "mlagents_version": "1.1.0.dev0", |
| "mlagents_envs_version": "1.1.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "2.2.0+cu121", |
| "numpy_version": "1.23.5", |
| "end_time_seconds": "1706736123" |
| }, |
| "total": 7591.881738983, |
| "count": 1, |
| "self": 0.5082409179995011, |
| "children": { |
| "run_training.setup": { |
| "total": 0.051130151999586815, |
| "count": 1, |
| "self": 0.051130151999586815 |
| }, |
| "TrainerController.start_learning": { |
| "total": 7591.322367913001, |
| "count": 1, |
| "self": 4.580546740238788, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 3.188782046000142, |
| "count": 1, |
| "self": 3.188782046000142 |
| }, |
| "TrainerController.advance": { |
| "total": 7583.460988532762, |
| "count": 194613, |
| "self": 4.724775389248862, |
| "children": { |
| "env_step": { |
| "total": 5582.194257566906, |
| "count": 194613, |
| "self": 5157.444570339441, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 421.9881304117371, |
| "count": 194613, |
| "self": 15.415391997128609, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 406.57273841460847, |
| "count": 187563, |
| "self": 406.57273841460847 |
| } |
| } |
| }, |
| "workers": { |
| "total": 2.7615568157279995, |
| "count": 194613, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 7574.286593487962, |
| "count": 194613, |
| "is_parallel": true, |
| "self": 2808.250156997893, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.005371056000058161, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.003946133999306767, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.001424922000751394, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.001424922000751394 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.053897405000043364, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0006992150001678965, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.0005338639998626604, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0005338639998626604 |
| }, |
| "communicator.exchange": { |
| "total": 0.050768492000315746, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.050768492000315746 |
| }, |
| "steps_from_proto": { |
| "total": 0.0018958339996970608, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.00040937699895948754, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0014864570007375733, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0014864570007375733 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 4766.036436490069, |
| "count": 194612, |
| "is_parallel": true, |
| "self": 111.07986765572969, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 78.7007358669689, |
| "count": 194612, |
| "is_parallel": true, |
| "self": 78.7007358669689 |
| }, |
| "communicator.exchange": { |
| "total": 4250.520715371329, |
| "count": 194612, |
| "is_parallel": true, |
| "self": 4250.520715371329 |
| }, |
| "steps_from_proto": { |
| "total": 325.73511759604116, |
| "count": 194612, |
| "is_parallel": true, |
| "self": 67.39921052791487, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 258.3359070681263, |
| "count": 1556896, |
| "is_parallel": true, |
| "self": 258.3359070681263 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 1996.5419555766066, |
| "count": 194613, |
| "self": 9.159311783740577, |
| "children": { |
| "process_trajectory": { |
| "total": 416.15789446488, |
| "count": 194613, |
| "self": 415.5295719828782, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.6283224820017494, |
| "count": 6, |
| "self": 0.6283224820017494 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 1571.224749327986, |
| "count": 1398, |
| "self": 930.3179039760244, |
| "children": { |
| "TorchPPOOptimizer.update": { |
| "total": 640.9068453519617, |
| "count": 68412, |
| "self": 640.9068453519617 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 1.0040002962341532e-06, |
| "count": 1, |
| "self": 1.0040002962341532e-06 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.09204958999907831, |
| "count": 1, |
| "self": 0.001677372998528881, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.09037221700054943, |
| "count": 1, |
| "self": 0.09037221700054943 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |