Changyu Gao

First Push

b26adec almost 3 years ago

18.3 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.925483763217926,
	"min": 0.925483763217926,
	"max": 1.4854224920272827,
	"count": 5
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 28105.091796875,
	"min": 28105.091796875,
	"max": 45061.77734375,
	"count": 5
	},
	"Pyramids.Step.mean": {
	"value": 149982.0,
	"min": 29952.0,
	"max": 149982.0,
	"count": 5
	},
	"Pyramids.Step.sum": {
	"value": 149982.0,
	"min": 29952.0,
	"max": 149982.0,
	"count": 5
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.05815637856721878,
	"min": -0.09418731182813644,
	"max": 0.0001792570692487061,
	"count": 5
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": -14.131999969482422,
	"min": -22.699142456054688,
	"max": 0.04248392581939697,
	"count": 5
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.08950106799602509,
	"min": 0.08950106799602509,
	"max": 0.3058807849884033,
	"count": 5
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 21.748760223388672,
	"min": 21.748760223388672,
	"max": 72.49374389648438,
	"count": 5
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06793653849306233,
	"min": 0.06793653849306233,
	"max": 0.0716153584697478,
	"count": 5
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.8831750004098102,
	"min": 0.4887146136687329,
	"max": 0.8831750004098102,
	"count": 5
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.002622824082214735,
	"min": 0.0005557609182493178,
	"max": 0.006334852572088312,
	"count": 5
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.034096713068791557,
	"min": 0.0044460873459945425,
	"max": 0.044343968004618185,
	"count": 5
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 0.00021874271939346154,
	"min": 0.00021874271939346154,
	"max": 0.00029030126037577137,
	"count": 5
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.002843655352115,
	"min": 0.0019146816617728003,
	"max": 0.002843655352115,
	"count": 5
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.1729142307692308,
	"min": 0.1729142307692308,
	"max": 0.19676708571428575,
	"count": 5
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 2.247885,
	"min": 1.3382272,
	"max": 2.247885,
	"count": 5
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.007294131653846152,
	"min": 0.007294131653846152,
	"max": 0.00967703186285714,
	"count": 5
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.09482371149999998,
	"min": 0.06382889727999999,
	"max": 0.09482371149999998,
	"count": 5
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.07258495688438416,
	"min": 0.07258495688438416,
	"max": 0.4456627666950226,
	"count": 5
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.9436044692993164,
	"min": 0.9436044692993164,
	"max": 3.1196393966674805,
	"count": 5
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 951.2857142857143,
	"min": 942.8787878787879,
	"max": 999.0,
	"count": 5
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 33295.0,
	"min": 15984.0,
	"max": 33295.0,
	"count": 5
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": -0.6663200523172106,
	"min": -1.0000000521540642,
	"max": -0.6406727760578647,
	"count": 5
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": -23.32120183110237,
	"min": -32.000001668930054,
	"max": -16.000000834465027,
	"count": 5
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": -0.6663200523172106,
	"min": -1.0000000521540642,
	"max": -0.6406727760578647,
	"count": 5
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": -23.32120183110237,
	"min": -32.000001668930054,
	"max": -16.000000834465027,
	"count": 5
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.7318932928144932,
	"min": 0.7318932928144932,
	"max": 9.054668163880706,
	"count": 5
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 25.61626524850726,
	"min": 25.61626524850726,
	"max": 144.8746906220913,
	"count": 5
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 5
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 5
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1686166175",
	"python_version": "3.10.11 (main, Apr 5 2023, 14:15:10) [GCC 9.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1686166530"
	},
	"total": 355.3194051390003,
	"count": 1,
	"self": 0.4724490980004248,
	"children": {
	"run_training.setup": {
	"total": 0.05494175700005144,
	"count": 1,
	"self": 0.05494175700005144
	},
	"TrainerController.start_learning": {
	"total": 354.79201428399983,
	"count": 1,
	"self": 0.23012636901921724,
	"children": {
	"TrainerController._reset_env": {
	"total": 4.8237584920000245,
	"count": 1,
	"self": 4.8237584920000245
	},
	"TrainerController.advance": {
	"total": 349.7348349659808,
	"count": 11205,
	"self": 0.23454281000113042,
	"children": {
	"env_step": {
	"total": 236.48923420098936,
	"count": 11205,
	"self": 216.9719004049955,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 19.382279875993618,
	"count": 11205,
	"self": 0.825565159010921,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 18.556714716982697,
	"count": 11177,
	"self": 18.556714716982697
	}
	}
	},
	"workers": {
	"total": 0.13505392000024585,
	"count": 11204,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 354.09471588100655,
	"count": 11204,
	"is_parallel": true,
	"self": 156.39775927301412,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.004157110000051034,
	"count": 1,
	"is_parallel": true,
	"self": 0.002264487999582343,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0018926220004686911,
	"count": 8,
	"is_parallel": true,
	"self": 0.0018926220004686911
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.04948453800011521,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005666399999881833,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0005429540001387068,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005429540001387068
	},
	"communicator.exchange": {
	"total": 0.046561502000031396,
	"count": 1,
	"is_parallel": true,
	"self": 0.046561502000031396
	},
	"steps_from_proto": {
	"total": 0.0018134419999569218,
	"count": 1,
	"is_parallel": true,
	"self": 0.00035785599993687356,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0014555860000200482,
	"count": 8,
	"is_parallel": true,
	"self": 0.0014555860000200482
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 197.69695660799243,
	"count": 11203,
	"is_parallel": true,
	"self": 5.61437618796117,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 4.01434996302919,
	"count": 11203,
	"is_parallel": true,
	"self": 4.01434996302919
	},
	"communicator.exchange": {
	"total": 170.770776979007,
	"count": 11203,
	"is_parallel": true,
	"self": 170.770776979007
	},
	"steps_from_proto": {
	"total": 17.297453477995077,
	"count": 11203,
	"is_parallel": true,
	"self": 3.5061899969916794,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 13.791263481003398,
	"count": 89624,
	"is_parallel": true,
	"self": 13.791263481003398
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 113.01105795499029,
	"count": 11204,
	"self": 0.3113298669898086,
	"children": {
	"process_trajectory": {
	"total": 17.913187625001456,
	"count": 11204,
	"self": 17.913187625001456
	},
	"_update_policy": {
	"total": 94.78654046299903,
	"count": 58,
	"self": 60.67647631799355,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 34.11006414500548,
	"count": 4122,
	"self": 34.11006414500548
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.3730000318901148e-06,
	"count": 1,
	"self": 1.3730000318901148e-06
	},
	"TrainerController._save_models": {
	"total": 0.0032930839997789008,
	"count": 1,
	"self": 2.256399966427125e-05,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.0032705200001146295,
	"count": 1,
	"self": 0.0032705200001146295
	}
	}
	}
	}
	}
	}
	}