| { |
| "name": "root", |
| "gauges": { |
| "Pyramids.Policy.Entropy.mean": { |
| "value": 0.5354316830635071, |
| "min": 0.5354316830635071, |
| "max": 1.4879765510559082, |
| "count": 24 |
| }, |
| "Pyramids.Policy.Entropy.sum": { |
| "value": 16071.517578125, |
| "min": 16071.517578125, |
| "max": 45139.2578125, |
| "count": 24 |
| }, |
| "Pyramids.Step.mean": { |
| "value": 719967.0, |
| "min": 29965.0, |
| "max": 719967.0, |
| "count": 24 |
| }, |
| "Pyramids.Step.sum": { |
| "value": 719967.0, |
| "min": 29965.0, |
| "max": 719967.0, |
| "count": 24 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
| "value": 0.46009257435798645, |
| "min": -0.1223444864153862, |
| "max": 0.46009257435798645, |
| "count": 24 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
| "value": 124.2249984741211, |
| "min": -29.11798858642578, |
| "max": 124.2249984741211, |
| "count": 24 |
| }, |
| "Pyramids.Policy.RndValueEstimate.mean": { |
| "value": 0.021058104932308197, |
| "min": -0.012443069368600845, |
| "max": 0.4489564597606659, |
| "count": 24 |
| }, |
| "Pyramids.Policy.RndValueEstimate.sum": { |
| "value": 5.685688495635986, |
| "min": -3.2351980209350586, |
| "max": 106.85163879394531, |
| "count": 24 |
| }, |
| "Pyramids.Losses.PolicyLoss.mean": { |
| "value": 0.07148070406540119, |
| "min": 0.06517403315713939, |
| "max": 0.07585844562453523, |
| "count": 24 |
| }, |
| "Pyramids.Losses.PolicyLoss.sum": { |
| "value": 1.0007298569156167, |
| "min": 0.5154042914586715, |
| "max": 1.0817758405270674, |
| "count": 24 |
| }, |
| "Pyramids.Losses.ValueLoss.mean": { |
| "value": 0.01528131502328463, |
| "min": 0.0007489936297205103, |
| "max": 0.01528131502328463, |
| "count": 24 |
| }, |
| "Pyramids.Losses.ValueLoss.sum": { |
| "value": 0.21393841032598482, |
| "min": 0.008987923556646123, |
| "max": 0.21393841032598482, |
| "count": 24 |
| }, |
| "Pyramids.Policy.LearningRate.mean": { |
| "value": 0.00022950117349961665, |
| "min": 0.00022950117349961665, |
| "max": 0.0002984126148148429, |
| "count": 24 |
| }, |
| "Pyramids.Policy.LearningRate.sum": { |
| "value": 0.003213016428994633, |
| "min": 0.0020888883037039003, |
| "max": 0.0038853469048843988, |
| "count": 24 |
| }, |
| "Pyramids.Policy.Epsilon.mean": { |
| "value": 0.17650038333333332, |
| "min": 0.17650038333333332, |
| "max": 0.19947087142857142, |
| "count": 24 |
| }, |
| "Pyramids.Policy.Epsilon.sum": { |
| "value": 2.4710053666666663, |
| "min": 1.3962961, |
| "max": 2.7674782000000007, |
| "count": 24 |
| }, |
| "Pyramids.Policy.Beta.mean": { |
| "value": 0.007652388295, |
| "min": 0.007652388295, |
| "max": 0.009947140055714286, |
| "count": 24 |
| }, |
| "Pyramids.Policy.Beta.sum": { |
| "value": 0.10713343613, |
| "min": 0.06962998039, |
| "max": 0.12952204843999998, |
| "count": 24 |
| }, |
| "Pyramids.Losses.RNDLoss.mean": { |
| "value": 0.010132000781595707, |
| "min": 0.010132000781595707, |
| "max": 0.31084755063056946, |
| "count": 24 |
| }, |
| "Pyramids.Losses.RNDLoss.sum": { |
| "value": 0.14184801280498505, |
| "min": 0.14184801280498505, |
| "max": 2.1759328842163086, |
| "count": 24 |
| }, |
| "Pyramids.Environment.EpisodeLength.mean": { |
| "value": 421.72, |
| "min": 421.72, |
| "max": 999.0, |
| "count": 24 |
| }, |
| "Pyramids.Environment.EpisodeLength.sum": { |
| "value": 31629.0, |
| "min": 16636.0, |
| "max": 32708.0, |
| "count": 24 |
| }, |
| "Pyramids.Environment.CumulativeReward.mean": { |
| "value": 1.5249386477470397, |
| "min": -0.999987552408129, |
| "max": 1.5249386477470397, |
| "count": 24 |
| }, |
| "Pyramids.Environment.CumulativeReward.sum": { |
| "value": 114.37039858102798, |
| "min": -31.999601677060127, |
| "max": 114.37039858102798, |
| "count": 24 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.mean": { |
| "value": 1.5249386477470397, |
| "min": -0.999987552408129, |
| "max": 1.5249386477470397, |
| "count": 24 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.sum": { |
| "value": 114.37039858102798, |
| "min": -31.999601677060127, |
| "max": 114.37039858102798, |
| "count": 24 |
| }, |
| "Pyramids.Policy.RndReward.mean": { |
| "value": 0.04477264853582407, |
| "min": 0.04477264853582407, |
| "max": 5.834203359177884, |
| "count": 24 |
| }, |
| "Pyramids.Policy.RndReward.sum": { |
| "value": 3.3579486401868053, |
| "min": 3.200345461082179, |
| "max": 99.18145710602403, |
| "count": 24 |
| }, |
| "Pyramids.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 24 |
| }, |
| "Pyramids.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 24 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1690474902", |
| "python_version": "3.8.16 (default, Jun 12 2023, 18:09:05) \n[GCC 11.2.0]", |
| "command_line_arguments": "/global/home/users/lizhen/scratch/miniconda3/envs/huggingface/bin/mlagents-learn ../ml-agents/config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", |
| "mlagents_version": "0.31.0.dev0", |
| "mlagents_envs_version": "0.31.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "1.8.1+cu102", |
| "numpy_version": "1.21.2", |
| "end_time_seconds": "1690476910" |
| }, |
| "total": 2007.4402644950023, |
| "count": 1, |
| "self": 0.019585551985073835, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0628495890123304, |
| "count": 1, |
| "self": 0.0628495890123304 |
| }, |
| "TrainerController.start_learning": { |
| "total": 2007.357829354005, |
| "count": 1, |
| "self": 0.9330457296455279, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 17.90129806101322, |
| "count": 1, |
| "self": 17.90129806101322 |
| }, |
| "TrainerController.advance": { |
| "total": 1986.292932489363, |
| "count": 47287, |
| "self": 0.8639501665020362, |
| "children": { |
| "env_step": { |
| "total": 1415.4523650843475, |
| "count": 47287, |
| "self": 1341.8168204505346, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 73.07705894342507, |
| "count": 47287, |
| "self": 3.1242650105268694, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 69.9527939328982, |
| "count": 46550, |
| "self": 69.9527939328982 |
| } |
| } |
| }, |
| "workers": { |
| "total": 0.5584856903878972, |
| "count": 47286, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 2001.7802101577108, |
| "count": 47286, |
| "is_parallel": true, |
| "self": 753.0852439897717, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.013564358989242464, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.002854533988283947, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.010709825000958517, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.010709825000958517 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.06518930001766421, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0010782770114019513, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.0008892060141079128, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0008892060141079128 |
| }, |
| "communicator.exchange": { |
| "total": 0.05995043198345229, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.05995043198345229 |
| }, |
| "steps_from_proto": { |
| "total": 0.0032713850087020546, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0007223400461953133, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0025490449625067413, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0025490449625067413 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 1248.6949661679391, |
| "count": 47285, |
| "is_parallel": true, |
| "self": 44.633973296004115, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 33.083338855649345, |
| "count": 47285, |
| "is_parallel": true, |
| "self": 33.083338855649345 |
| }, |
| "communicator.exchange": { |
| "total": 1047.8523495950503, |
| "count": 47285, |
| "is_parallel": true, |
| "self": 1047.8523495950503 |
| }, |
| "steps_from_proto": { |
| "total": 123.12530442123534, |
| "count": 47285, |
| "is_parallel": true, |
| "self": 26.948400199238677, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 96.17690422199667, |
| "count": 378280, |
| "is_parallel": true, |
| "self": 96.17690422199667 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 569.9766172385134, |
| "count": 47286, |
| "self": 1.657787573582027, |
| "children": { |
| "process_trajectory": { |
| "total": 71.81227012249292, |
| "count": 47286, |
| "self": 71.64519006150658, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.16708006098633632, |
| "count": 1, |
| "self": 0.16708006098633632 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 496.5065595424385, |
| "count": 330, |
| "self": 251.4980613142252, |
| "children": { |
| "TorchPPOOptimizer.update": { |
| "total": 245.00849822821328, |
| "count": 16938, |
| "self": 245.00849822821328 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 3.762979758903384e-06, |
| "count": 1, |
| "self": 3.762979758903384e-06 |
| }, |
| "TrainerController._save_models": { |
| "total": 2.230549311003415, |
| "count": 1, |
| "self": 0.017922976025147364, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 2.2126263349782676, |
| "count": 1, |
| "self": 2.2126263349782676 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |