First Push

d74856d almost 3 years ago

18.8 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.17490901052951813,
	"min": 0.16398131847381592,
	"max": 1.4302674531936646,
	"count": 100
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 5278.05419921875,
	"min": 4903.697265625,
	"max": 43388.59375,
	"count": 100
	},
	"Pyramids.Step.mean": {
	"value": 2999951.0,
	"min": 29952.0,
	"max": 2999951.0,
	"count": 100
	},
	"Pyramids.Step.sum": {
	"value": 2999951.0,
	"min": 29952.0,
	"max": 2999951.0,
	"count": 100
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.7282366752624512,
	"min": -0.10632584989070892,
	"max": 0.8514661192893982,
	"count": 100
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 211.18862915039062,
	"min": -25.518203735351562,
	"max": 258.845703125,
	"count": 100
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": -0.010904678143560886,
	"min": -0.019113825634121895,
	"max": 0.645065426826477,
	"count": 100
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": -3.1623566150665283,
	"min": -5.791489124298096,
	"max": 152.88050842285156,
	"count": 100
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.07045070029562339,
	"min": 0.06448170247578051,
	"max": 0.07583584167973723,
	"count": 100
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9863098041387275,
	"min": 0.5011433693446519,
	"max": 1.101917128583106,
	"count": 100
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.015463917435789924,
	"min": 0.00047009329222738805,
	"max": 0.02875869644473222,
	"count": 100
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.21649484410105893,
	"min": 0.006111212798956045,
	"max": 0.2539350916665759,
	"count": 100
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 1.4725209377642907e-06,
	"min": 1.4725209377642907e-06,
	"max": 0.00029838354339596195,
	"count": 100
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 2.061529312870007e-05,
	"min": 2.061529312870007e-05,
	"max": 0.0038429512190162997,
	"count": 100
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10049080714285714,
	"min": 0.10049080714285714,
	"max": 0.19946118095238097,
	"count": 100
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4068713,
	"min": 1.3897045333333333,
	"max": 2.722569266666667,
	"count": 100
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 5.903163357142875e-05,
	"min": 5.903163357142875e-05,
	"max": 0.009946171977142856,
	"count": 100
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.0008264428700000025,
	"min": 0.0008264428700000025,
	"max": 0.12811027163,
	"count": 100
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.005767387803643942,
	"min": 0.00550212012603879,
	"max": 0.593696653842926,
	"count": 100
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.08074343204498291,
	"min": 0.07702968269586563,
	"max": 4.155876636505127,
	"count": 100
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 236.5984251968504,
	"min": 217.13533834586465,
	"max": 999.0,
	"count": 100
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 30048.0,
	"min": 15984.0,
	"max": 32849.0,
	"count": 100
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.7476456504989797,
	"min": -1.0000000521540642,
	"max": 1.7744094390334106,
	"count": 100
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 221.95099761337042,
	"min": -32.000001668930054,
	"max": 241.5609978362918,
	"count": 100
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.7476456504989797,
	"min": -1.0000000521540642,
	"max": 1.7744094390334106,
	"count": 100
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 221.95099761337042,
	"min": -32.000001668930054,
	"max": 241.5609978362918,
	"count": 100
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.014373364153592645,
	"min": 0.0126526198067389,
	"max": 14.521467708051205,
	"count": 100
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 1.825417247506266,
	"min": 1.6723010244968464,
	"max": 232.34348332881927,
	"count": 100
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 100
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 100
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1682587399",
	"python_version": "3.9.16 (main, Mar 8 2023, 14:00:05) \n[GCC 11.2.0]",
	"command_line_arguments": "/home/ntrant/anaconda3/envs/rl/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu113",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1682589781"
	},
	"total": 2382.4878098119516,
	"count": 1,
	"self": 0.21826302981935441,
	"children": {
	"run_training.setup": {
	"total": 0.01288121403194964,
	"count": 1,
	"self": 0.01288121403194964
	},
	"TrainerController.start_learning": {
	"total": 2382.2566655681003,
	"count": 1,
	"self": 1.9276359151117504,
	"children": {
	"TrainerController._reset_env": {
	"total": 3.888193927006796,
	"count": 1,
	"self": 3.888193927006796
	},
	"TrainerController.advance": {
	"total": 2376.393455961952,
	"count": 194535,
	"self": 1.8915775606874377,
	"children": {
	"env_step": {
	"total": 1443.0404986417852,
	"count": 194535,
	"self": 1283.5638633763883,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 158.27946001267992,
	"count": 194535,
	"self": 6.123884355183691,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 152.15557565749623,
	"count": 187557,
	"self": 152.15557565749623
	}
	}
	},
	"workers": {
	"total": 1.1971752527169883,
	"count": 194535,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2379.4368221322075,
	"count": 194535,
	"is_parallel": true,
	"self": 1226.9768003886566,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0009483250323683023,
	"count": 1,
	"is_parallel": true,
	"self": 0.0002904192078858614,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.000657905824482441,
	"count": 8,
	"is_parallel": true,
	"self": 0.000657905824482441
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.02145201014354825,
	"count": 1,
	"is_parallel": true,
	"self": 0.00024907919578254223,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.00029695802368223667,
	"count": 1,
	"is_parallel": true,
	"self": 0.00029695802368223667
	},
	"communicator.exchange": {
	"total": 0.020106848096475005,
	"count": 1,
	"is_parallel": true,
	"self": 0.020106848096475005
	},
	"steps_from_proto": {
	"total": 0.0007991248276084661,
	"count": 1,
	"is_parallel": true,
	"self": 0.00018501910381019115,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.000614105723798275,
	"count": 8,
	"is_parallel": true,
	"self": 0.000614105723798275
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1152.460021743551,
	"count": 194534,
	"is_parallel": true,
	"self": 37.468936015153304,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 25.305287588387728,
	"count": 194534,
	"is_parallel": true,
	"self": 25.305287588387728
	},
	"communicator.exchange": {
	"total": 981.8986218154896,
	"count": 194534,
	"is_parallel": true,
	"self": 981.8986218154896
	},
	"steps_from_proto": {
	"total": 107.78717632452026,
	"count": 194534,
	"is_parallel": true,
	"self": 23.479633159702644,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 84.30754316481762,
	"count": 1556272,
	"is_parallel": true,
	"self": 84.30754316481762
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 931.4613797594793,
	"count": 194535,
	"self": 3.435052201617509,
	"children": {
	"process_trajectory": {
	"total": 156.43625362799503,
	"count": 194535,
	"self": 156.13586911163293,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.30038451636210084,
	"count": 6,
	"self": 0.30038451636210084
	}
	}
	},
	"_update_policy": {
	"total": 771.5900739298668,
	"count": 1390,
	"self": 467.68752431566827,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 303.9025496141985,
	"count": 68376,
	"self": 303.9025496141985
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 6.400514394044876e-07,
	"count": 1,
	"self": 6.400514394044876e-07
	},
	"TrainerController._save_models": {
	"total": 0.047379123978316784,
	"count": 1,
	"self": 0.0005925619043409824,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.0467865620739758,
	"count": 1,
	"self": 0.0467865620739758
	}
	}
	}
	}
	}
	}
	}