| { |
| "name": "root", |
| "gauges": { |
| "Pyramids.Policy.Entropy.mean": { |
| "value": 0.40372198820114136, |
| "min": 0.3707912564277649, |
| "max": 1.4556697607040405, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Entropy.sum": { |
| "value": 12163.3359375, |
| "min": 11117.8046875, |
| "max": 44159.19921875, |
| "count": 33 |
| }, |
| "Pyramids.Step.mean": { |
| "value": 989942.0, |
| "min": 29952.0, |
| "max": 989942.0, |
| "count": 33 |
| }, |
| "Pyramids.Step.sum": { |
| "value": 989942.0, |
| "min": 29952.0, |
| "max": 989942.0, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
| "value": 0.48312079906463623, |
| "min": -0.12045388668775558, |
| "max": 0.5584696531295776, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
| "value": 128.99325561523438, |
| "min": -29.029386520385742, |
| "max": 158.04690551757812, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndValueEstimate.mean": { |
| "value": 0.01817130297422409, |
| "min": 0.005104883573949337, |
| "max": 0.6336129903793335, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndValueEstimate.sum": { |
| "value": 4.851737976074219, |
| "min": 1.2506964206695557, |
| "max": 150.16627502441406, |
| "count": 33 |
| }, |
| "Pyramids.Losses.PolicyLoss.mean": { |
| "value": 0.06641971863314716, |
| "min": 0.06579809887279268, |
| "max": 0.07317178811557905, |
| "count": 33 |
| }, |
| "Pyramids.Losses.PolicyLoss.sum": { |
| "value": 0.9962957794972075, |
| "min": 0.505382156863624, |
| "max": 1.0560386154102162, |
| "count": 33 |
| }, |
| "Pyramids.Losses.ValueLoss.mean": { |
| "value": 0.01461627717007003, |
| "min": 0.00025806463729980973, |
| "max": 0.021735412348069565, |
| "count": 33 |
| }, |
| "Pyramids.Losses.ValueLoss.sum": { |
| "value": 0.21924415755105045, |
| "min": 0.003612904922197336, |
| "max": 0.22101005170649538, |
| "count": 33 |
| }, |
| "Pyramids.Policy.LearningRate.mean": { |
| "value": 7.514197495300002e-06, |
| "min": 7.514197495300002e-06, |
| "max": 0.00029515063018788575, |
| "count": 33 |
| }, |
| "Pyramids.Policy.LearningRate.sum": { |
| "value": 0.00011271296242950003, |
| "min": 0.00011271296242950003, |
| "max": 0.0036325057891648, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Epsilon.mean": { |
| "value": 0.10250470000000003, |
| "min": 0.10250470000000003, |
| "max": 0.19838354285714285, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Epsilon.sum": { |
| "value": 1.5375705000000004, |
| "min": 1.3886848, |
| "max": 2.6108352000000004, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Beta.mean": { |
| "value": 0.00026021953000000006, |
| "min": 0.00026021953000000006, |
| "max": 0.00983851593142857, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Beta.sum": { |
| "value": 0.003903292950000001, |
| "min": 0.003903292950000001, |
| "max": 0.12110243648, |
| "count": 33 |
| }, |
| "Pyramids.Losses.RNDLoss.mean": { |
| "value": 0.015856942161917686, |
| "min": 0.015856942161917686, |
| "max": 0.6128483414649963, |
| "count": 33 |
| }, |
| "Pyramids.Losses.RNDLoss.sum": { |
| "value": 0.23785413801670074, |
| "min": 0.22693490982055664, |
| "max": 4.289938449859619, |
| "count": 33 |
| }, |
| "Pyramids.Environment.EpisodeLength.mean": { |
| "value": 377.9078947368421, |
| "min": 303.1443298969072, |
| "max": 999.0, |
| "count": 33 |
| }, |
| "Pyramids.Environment.EpisodeLength.sum": { |
| "value": 28721.0, |
| "min": 15984.0, |
| "max": 33368.0, |
| "count": 33 |
| }, |
| "Pyramids.Environment.CumulativeReward.mean": { |
| "value": 1.5170026530822118, |
| "min": -1.0000000521540642, |
| "max": 1.6762309146603358, |
| "count": 33 |
| }, |
| "Pyramids.Environment.CumulativeReward.sum": { |
| "value": 113.77519898116589, |
| "min": -30.40620169788599, |
| "max": 162.59439872205257, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.mean": { |
| "value": 1.5170026530822118, |
| "min": -1.0000000521540642, |
| "max": 1.6762309146603358, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.sum": { |
| "value": 113.77519898116589, |
| "min": -30.40620169788599, |
| "max": 162.59439872205257, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndReward.mean": { |
| "value": 0.06242571748249854, |
| "min": 0.05358445981127983, |
| "max": 13.34334221854806, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndReward.sum": { |
| "value": 4.68192881118739, |
| "min": 4.68192881118739, |
| "max": 213.49347549676895, |
| "count": 33 |
| }, |
| "Pyramids.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 33 |
| }, |
| "Pyramids.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 33 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1699561951", |
| "python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]", |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
| "mlagents_version": "1.1.0.dev0", |
| "mlagents_envs_version": "1.1.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "2.1.0+cu118", |
| "numpy_version": "1.23.5", |
| "end_time_seconds": "1699564167" |
| }, |
| "total": 2216.238286706, |
| "count": 1, |
| "self": 0.47654615500005093, |
| "children": { |
| "run_training.setup": { |
| "total": 0.04511496999998599, |
| "count": 1, |
| "self": 0.04511496999998599 |
| }, |
| "TrainerController.start_learning": { |
| "total": 2215.716625581, |
| "count": 1, |
| "self": 1.2220533800077646, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 8.93151507399989, |
| "count": 1, |
| "self": 8.93151507399989 |
| }, |
| "TrainerController.advance": { |
| "total": 2205.486150846992, |
| "count": 63695, |
| "self": 1.3049954610214627, |
| "children": { |
| "env_step": { |
| "total": 1580.526663182951, |
| "count": 63695, |
| "self": 1453.0760863549822, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 126.68077171797495, |
| "count": 63695, |
| "self": 4.621322425028893, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 122.05944929294606, |
| "count": 62558, |
| "self": 122.05944929294606 |
| } |
| } |
| }, |
| "workers": { |
| "total": 0.7698051099939676, |
| "count": 63695, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 2211.231235368969, |
| "count": 63695, |
| "is_parallel": true, |
| "self": 867.8587928839845, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.005095142000072883, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.003562445000397929, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.001532696999674954, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.001532696999674954 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.04986780800004453, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0006248610000056942, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.0004741630000353325, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0004741630000353325 |
| }, |
| "communicator.exchange": { |
| "total": 0.04719653400002244, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.04719653400002244 |
| }, |
| "steps_from_proto": { |
| "total": 0.001572249999981068, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0003394589998606534, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0012327910001204145, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0012327910001204145 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 1343.3724424849845, |
| "count": 63694, |
| "is_parallel": true, |
| "self": 34.690201781023006, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 23.850148585025636, |
| "count": 63694, |
| "is_parallel": true, |
| "self": 23.850148585025636 |
| }, |
| "communicator.exchange": { |
| "total": 1187.430589418954, |
| "count": 63694, |
| "is_parallel": true, |
| "self": 1187.430589418954 |
| }, |
| "steps_from_proto": { |
| "total": 97.40150269998185, |
| "count": 63694, |
| "is_parallel": true, |
| "self": 18.943393323022065, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 78.45810937695978, |
| "count": 509552, |
| "is_parallel": true, |
| "self": 78.45810937695978 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 623.6544922030193, |
| "count": 63695, |
| "self": 2.3886360759681793, |
| "children": { |
| "process_trajectory": { |
| "total": 119.7939376970412, |
| "count": 63695, |
| "self": 119.58311027904165, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.2108274179995533, |
| "count": 2, |
| "self": 0.2108274179995533 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 501.47191843000996, |
| "count": 453, |
| "self": 300.3981185300297, |
| "children": { |
| "TorchPPOOptimizer.update": { |
| "total": 201.07379989998026, |
| "count": 22788, |
| "self": 201.07379989998026 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 1.0600001587590668e-06, |
| "count": 1, |
| "self": 1.0600001587590668e-06 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.07690521999984412, |
| "count": 1, |
| "self": 0.0013572259995271452, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.07554799400031698, |
| "count": 1, |
| "self": 0.07554799400031698 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |