{ "name": "root", "gauges": { "Pyramids.Policy.Entropy.mean": { "value": 0.18083599209785461, "min": 0.1753084659576416, "max": 1.5017955303192139, "count": 100 }, "Pyramids.Policy.Entropy.sum": { "value": 5436.6533203125, "min": 5249.01318359375, "max": 45558.46875, "count": 100 }, "Pyramids.Step.mean": { "value": 2999984.0, "min": 29952.0, "max": 2999984.0, "count": 100 }, "Pyramids.Step.sum": { "value": 2999984.0, "min": 29952.0, "max": 2999984.0, "count": 100 }, "Pyramids.Policy.ExtrinsicValueEstimate.mean": { "value": 0.6283080577850342, "min": -0.1075344979763031, "max": 0.710053563117981, "count": 100 }, "Pyramids.Policy.ExtrinsicValueEstimate.sum": { "value": 182.20933532714844, "min": -25.808279037475586, "max": 206.62559509277344, "count": 100 }, "Pyramids.Policy.RndValueEstimate.mean": { "value": 0.013113018125295639, "min": -0.045015666633844376, "max": 0.2258395403623581, "count": 100 }, "Pyramids.Policy.RndValueEstimate.sum": { "value": 3.8027751445770264, "min": -12.244261741638184, "max": 53.52397155761719, "count": 100 }, "Pyramids.Losses.PolicyLoss.mean": { "value": 0.06543375354577168, "min": 0.06533164033850986, "max": 0.07680259531834888, "count": 100 }, "Pyramids.Losses.PolicyLoss.sum": { "value": 0.9160725496408034, "min": 0.49085674155436604, "max": 1.1051700265767672, "count": 100 }, "Pyramids.Losses.ValueLoss.mean": { "value": 0.014990372544811439, "min": 5.436072959934471e-05, "max": 0.016239398962560308, "count": 100 }, "Pyramids.Losses.ValueLoss.sum": { "value": 0.20986521562736016, "min": 0.0006523287551921365, "max": 0.23327813882982204, "count": 100 }, "Pyramids.Policy.LearningRate.mean": { "value": 1.4828137914761926e-06, "min": 1.4828137914761926e-06, "max": 0.00029838354339596195, "count": 100 }, "Pyramids.Policy.LearningRate.sum": { "value": 2.0759393080666696e-05, "min": 2.0759393080666696e-05, "max": 0.0036750671749776658, "count": 100 }, "Pyramids.Policy.Epsilon.mean": { "value": 0.10049423809523808, "min": 0.10049423809523808, "max": 0.19946118095238097, "count": 100 }, "Pyramids.Policy.Epsilon.sum": { "value": 1.4069193333333332, "min": 1.3897045333333333, "max": 2.6774543, "count": 100 }, "Pyramids.Policy.Beta.mean": { "value": 5.937438571428578e-05, "min": 5.937438571428578e-05, "max": 0.009946171977142856, "count": 100 }, "Pyramids.Policy.Beta.sum": { "value": 0.0008312414000000009, "min": 0.0008312414000000009, "max": 0.12251973110000003, "count": 100 }, "Pyramids.Losses.RNDLoss.mean": { "value": 0.002524538431316614, "min": 0.002524538431316614, "max": 0.31970641016960144, "count": 100 }, "Pyramids.Losses.RNDLoss.sum": { "value": 0.03534353896975517, "min": 0.03534353896975517, "max": 2.2379448413848877, "count": 100 }, "Pyramids.Environment.EpisodeLength.mean": { "value": 295.1509433962264, "min": 257.070796460177, "max": 999.0, "count": 100 }, "Pyramids.Environment.EpisodeLength.sum": { "value": 31286.0, "min": 15984.0, "max": 33219.0, "count": 100 }, "Pyramids.Environment.CumulativeReward.mean": { "value": 1.64823017079594, "min": -1.0000000521540642, "max": 1.7397192809403987, "count": 100 }, "Pyramids.Environment.CumulativeReward.sum": { "value": 174.71239810436964, "min": -32.000001668930054, "max": 198.32799802720547, "count": 100 }, "Pyramids.Policy.ExtrinsicReward.mean": { "value": 1.64823017079594, "min": -1.0000000521540642, "max": 1.7397192809403987, "count": 100 }, "Pyramids.Policy.ExtrinsicReward.sum": { "value": 174.71239810436964, "min": -32.000001668930054, "max": 198.32799802720547, "count": 100 }, "Pyramids.Policy.RndReward.mean": { "value": 0.007778382844130733, "min": 0.007355977590729405, "max": 6.568125128746033, "count": 100 }, "Pyramids.Policy.RndReward.sum": { "value": 0.8245085814778577, "min": 0.7868847954487137, "max": 105.09000205993652, "count": 100 }, "Pyramids.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 100 }, "Pyramids.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 100 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1771817183", "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]", "command_line_arguments": "/usr/local/envs/mlagents_env/bin/mlagents-learn /content/ml-agents/config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", "mlagents_version": "1.2.0.dev0", "mlagents_envs_version": "1.2.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "2.8.0+cu128", "numpy_version": "1.23.5", "end_time_seconds": "1771824291" }, "total": 7107.776239903, "count": 1, "self": 0.5264534219995767, "children": { "run_training.setup": { "total": 0.01900760100033949, "count": 1, "self": 0.01900760100033949 }, "TrainerController.start_learning": { "total": 7107.23077888, "count": 1, "self": 4.64455457547956, "children": { "TrainerController._reset_env": { "total": 2.0930156269996587, "count": 1, "self": 2.0930156269996587 }, "TrainerController.advance": { "total": 7100.415967424522, "count": 193200, "self": 4.922077457418709, "children": { "env_step": { "total": 5076.800874323141, "count": 193200, "self": 4588.924436536091, "children": { "SubprocessEnvManager._take_step": { "total": 485.0967085192651, "count": 193200, "self": 14.74740999003734, "children": { "TorchPolicy.evaluate": { "total": 470.3492985292278, "count": 187557, "self": 470.3492985292278 } } }, "workers": { "total": 2.7797292677851146, "count": 193200, "self": 0.0, "children": { "worker_root": { "total": 7088.043072083577, "count": 193200, "is_parallel": true, "self": 2874.006202681652, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.0019067630000790814, "count": 1, "is_parallel": true, "self": 0.0006636380003328668, "children": { "_process_rank_one_or_two_observation": { "total": 0.0012431249997462146, "count": 8, "is_parallel": true, "self": 0.0012431249997462146 } } }, "UnityEnvironment.step": { "total": 0.04939114300032088, "count": 1, "is_parallel": true, "self": 0.0006225080005606287, "children": { "UnityEnvironment._generate_step_input": { "total": 0.0005004570002711262, "count": 1, "is_parallel": true, "self": 0.0005004570002711262 }, "communicator.exchange": { "total": 0.04644637999990664, "count": 1, "is_parallel": true, "self": 0.04644637999990664 }, "steps_from_proto": { "total": 0.0018217979995824862, "count": 1, "is_parallel": true, "self": 0.00039283499972952995, "children": { "_process_rank_one_or_two_observation": { "total": 0.0014289629998529563, "count": 8, "is_parallel": true, "self": 0.0014289629998529563 } } } } } } }, "UnityEnvironment.step": { "total": 4214.036869401924, "count": 193199, "is_parallel": true, "self": 106.85728159333121, "children": { "UnityEnvironment._generate_step_input": { "total": 75.00446174797798, "count": 193199, "is_parallel": true, "self": 75.00446174797798 }, "communicator.exchange": { "total": 3688.72128981442, "count": 193199, "is_parallel": true, "self": 3688.72128981442 }, "steps_from_proto": { "total": 343.45383624619535, "count": 193199, "is_parallel": true, "self": 72.49425999826599, "children": { "_process_rank_one_or_two_observation": { "total": 270.95957624792936, "count": 1545592, "is_parallel": true, "self": 270.95957624792936 } } } } } } } } } } }, "trainer_advance": { "total": 2018.693015643962, "count": 193200, "self": 8.837307861845147, "children": { "process_trajectory": { "total": 397.01164160717144, "count": 193200, "self": 396.39577367117, "children": { "RLTrainer._checkpoint": { "total": 0.6158679360014503, "count": 6, "self": 0.6158679360014503 } } }, "_update_policy": { "total": 1612.8440661749455, "count": 1374, "self": 886.0230709779626, "children": { "TorchPPOOptimizer.update": { "total": 726.820995196983, "count": 68463, "self": 726.820995196983 } } } } } } }, "trainer_threads": { "total": 1.0159983503399417e-06, "count": 1, "self": 1.0159983503399417e-06 }, "TrainerController._save_models": { "total": 0.07724023700029647, "count": 1, "self": 0.0010557690002315212, "children": { "RLTrainer._checkpoint": { "total": 0.07618446800006495, "count": 1, "self": 0.07618446800006495 } } } } } } }