dev

45eec8a over 2 years ago

18.8 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.5354316830635071,
	"min": 0.5354316830635071,
	"max": 1.4879765510559082,
	"count": 24
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 16071.517578125,
	"min": 16071.517578125,
	"max": 45139.2578125,
	"count": 24
	},
	"Pyramids.Step.mean": {
	"value": 719967.0,
	"min": 29965.0,
	"max": 719967.0,
	"count": 24
	},
	"Pyramids.Step.sum": {
	"value": 719967.0,
	"min": 29965.0,
	"max": 719967.0,
	"count": 24
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.46009257435798645,
	"min": -0.1223444864153862,
	"max": 0.46009257435798645,
	"count": 24
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 124.2249984741211,
	"min": -29.11798858642578,
	"max": 124.2249984741211,
	"count": 24
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.021058104932308197,
	"min": -0.012443069368600845,
	"max": 0.4489564597606659,
	"count": 24
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 5.685688495635986,
	"min": -3.2351980209350586,
	"max": 106.85163879394531,
	"count": 24
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.07148070406540119,
	"min": 0.06517403315713939,
	"max": 0.07585844562453523,
	"count": 24
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 1.0007298569156167,
	"min": 0.5154042914586715,
	"max": 1.0817758405270674,
	"count": 24
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.01528131502328463,
	"min": 0.0007489936297205103,
	"max": 0.01528131502328463,
	"count": 24
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.21393841032598482,
	"min": 0.008987923556646123,
	"max": 0.21393841032598482,
	"count": 24
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 0.00022950117349961665,
	"min": 0.00022950117349961665,
	"max": 0.0002984126148148429,
	"count": 24
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.003213016428994633,
	"min": 0.0020888883037039003,
	"max": 0.0038853469048843988,
	"count": 24
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.17650038333333332,
	"min": 0.17650038333333332,
	"max": 0.19947087142857142,
	"count": 24
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 2.4710053666666663,
	"min": 1.3962961,
	"max": 2.7674782000000007,
	"count": 24
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.007652388295,
	"min": 0.007652388295,
	"max": 0.009947140055714286,
	"count": 24
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.10713343613,
	"min": 0.06962998039,
	"max": 0.12952204843999998,
	"count": 24
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.010132000781595707,
	"min": 0.010132000781595707,
	"max": 0.31084755063056946,
	"count": 24
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.14184801280498505,
	"min": 0.14184801280498505,
	"max": 2.1759328842163086,
	"count": 24
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 421.72,
	"min": 421.72,
	"max": 999.0,
	"count": 24
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 31629.0,
	"min": 16636.0,
	"max": 32708.0,
	"count": 24
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.5249386477470397,
	"min": -0.999987552408129,
	"max": 1.5249386477470397,
	"count": 24
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 114.37039858102798,
	"min": -31.999601677060127,
	"max": 114.37039858102798,
	"count": 24
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.5249386477470397,
	"min": -0.999987552408129,
	"max": 1.5249386477470397,
	"count": 24
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 114.37039858102798,
	"min": -31.999601677060127,
	"max": 114.37039858102798,
	"count": 24
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.04477264853582407,
	"min": 0.04477264853582407,
	"max": 5.834203359177884,
	"count": 24
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 3.3579486401868053,
	"min": 3.200345461082179,
	"max": 99.18145710602403,
	"count": 24
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 24
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 24
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1690474902",
	"python_version": "3.8.16 (default, Jun 12 2023, 18:09:05) \n[GCC 11.2.0]",
	"command_line_arguments": "/global/home/users/lizhen/scratch/miniconda3/envs/huggingface/bin/mlagents-learn ../ml-agents/config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.8.1+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1690476910"
	},
	"total": 2007.4402644950023,
	"count": 1,
	"self": 0.019585551985073835,
	"children": {
	"run_training.setup": {
	"total": 0.0628495890123304,
	"count": 1,
	"self": 0.0628495890123304
	},
	"TrainerController.start_learning": {
	"total": 2007.357829354005,
	"count": 1,
	"self": 0.9330457296455279,
	"children": {
	"TrainerController._reset_env": {
	"total": 17.90129806101322,
	"count": 1,
	"self": 17.90129806101322
	},
	"TrainerController.advance": {
	"total": 1986.292932489363,
	"count": 47287,
	"self": 0.8639501665020362,
	"children": {
	"env_step": {
	"total": 1415.4523650843475,
	"count": 47287,
	"self": 1341.8168204505346,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 73.07705894342507,
	"count": 47287,
	"self": 3.1242650105268694,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 69.9527939328982,
	"count": 46550,
	"self": 69.9527939328982
	}
	}
	},
	"workers": {
	"total": 0.5584856903878972,
	"count": 47286,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2001.7802101577108,
	"count": 47286,
	"is_parallel": true,
	"self": 753.0852439897717,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.013564358989242464,
	"count": 1,
	"is_parallel": true,
	"self": 0.002854533988283947,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.010709825000958517,
	"count": 8,
	"is_parallel": true,
	"self": 0.010709825000958517
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.06518930001766421,
	"count": 1,
	"is_parallel": true,
	"self": 0.0010782770114019513,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0008892060141079128,
	"count": 1,
	"is_parallel": true,
	"self": 0.0008892060141079128
	},
	"communicator.exchange": {
	"total": 0.05995043198345229,
	"count": 1,
	"is_parallel": true,
	"self": 0.05995043198345229
	},
	"steps_from_proto": {
	"total": 0.0032713850087020546,
	"count": 1,
	"is_parallel": true,
	"self": 0.0007223400461953133,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0025490449625067413,
	"count": 8,
	"is_parallel": true,
	"self": 0.0025490449625067413
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1248.6949661679391,
	"count": 47285,
	"is_parallel": true,
	"self": 44.633973296004115,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 33.083338855649345,
	"count": 47285,
	"is_parallel": true,
	"self": 33.083338855649345
	},
	"communicator.exchange": {
	"total": 1047.8523495950503,
	"count": 47285,
	"is_parallel": true,
	"self": 1047.8523495950503
	},
	"steps_from_proto": {
	"total": 123.12530442123534,
	"count": 47285,
	"is_parallel": true,
	"self": 26.948400199238677,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 96.17690422199667,
	"count": 378280,
	"is_parallel": true,
	"self": 96.17690422199667
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 569.9766172385134,
	"count": 47286,
	"self": 1.657787573582027,
	"children": {
	"process_trajectory": {
	"total": 71.81227012249292,
	"count": 47286,
	"self": 71.64519006150658,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.16708006098633632,
	"count": 1,
	"self": 0.16708006098633632
	}
	}
	},
	"_update_policy": {
	"total": 496.5065595424385,
	"count": 330,
	"self": 251.4980613142252,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 245.00849822821328,
	"count": 16938,
	"self": 245.00849822821328
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 3.762979758903384e-06,
	"count": 1,
	"self": 3.762979758903384e-06
	},
	"TrainerController._save_models": {
	"total": 2.230549311003415,
	"count": 1,
	"self": 0.017922976025147364,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 2.2126263349782676,
	"count": 1,
	"self": 2.2126263349782676
	}
	}
	}
	}
	}
	}
	}