First

90b1fcb verified about 2 years ago

18.8 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.18705493211746216,
	"min": 0.16478247940540314,
	"max": 0.44203102588653564,
	"count": 33
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 5605.662109375,
	"min": 4938.201171875,
	"max": 12799.0361328125,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 240.1328125,
	"min": 229.35245901639345,
	"max": 336.12359550561797,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 30737.0,
	"min": 17589.0,
	"max": 32323.0,
	"count": 33
	},
	"Pyramids.Step.mean": {
	"value": 1979907.0,
	"min": 1019938.0,
	"max": 1979907.0,
	"count": 33
	},
	"Pyramids.Step.sum": {
	"value": 1979907.0,
	"min": 1019938.0,
	"max": 1979907.0,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.7753037214279175,
	"min": 0.5842857956886292,
	"max": 0.7826550602912903,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 234.1417236328125,
	"min": 112.94467163085938,
	"max": 234.1417236328125,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.007218698039650917,
	"min": -0.011078650131821632,
	"max": 0.023848215118050575,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 2.180046796798706,
	"min": -2.0495502948760986,
	"max": 6.987526893615723,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.7451243954380666,
	"min": 1.5533956757956935,
	"max": 1.7542524447695154,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 221.63079822063446,
	"min": 108.40999849885702,
	"max": 221.63079822063446,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.7451243954380666,
	"min": 1.5533956757956935,
	"max": 1.7542524447695154,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 221.63079822063446,
	"min": 108.40999849885702,
	"max": 221.63079822063446,
	"count": 33
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.024534388826761254,
	"min": 0.024235264870737006,
	"max": 0.04270739211014271,
	"count": 33
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 3.1158673809986794,
	"min": 2.254476272595639,
	"max": 3.9742181365727447,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06661360270559921,
	"min": 0.06401529681924904,
	"max": 0.07187034715371694,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9325904378783889,
	"min": 0.5761376713732413,
	"max": 1.074378561701023,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.016130074523278467,
	"min": 0.013827307654967978,
	"max": 0.017788065528859278,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.22582104332589853,
	"min": 0.141306401375914,
	"max": 0.2668209829328892,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 5.160880422596431e-06,
	"min": 5.160880422596431e-06,
	"max": 0.00014840945053020002,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 7.225232591635003e-05,
	"min": 7.225232591635003e-05,
	"max": 0.0020269283743574503,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10172026071428573,
	"min": 0.10172026071428573,
	"max": 0.14946979999999999,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4240836500000003,
	"min": 1.3452282,
	"max": 2.1564575500000003,
	"count": 33
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.00018185404535714294,
	"min": 0.00018185404535714294,
	"max": 0.004952033020000001,
	"count": 33
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.002545956635000001,
	"min": 0.002545956635000001,
	"max": 0.06763669074499999,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.009958143346011639,
	"min": 0.008901664055883884,
	"max": 0.012760956771671772,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.1394140124320984,
	"min": 0.11117810755968094,
	"max": 0.1889527291059494,
	"count": 33
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1711997790",
	"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics --resume",
	"mlagents_version": "1.1.0.dev0",
	"mlagents_envs_version": "1.1.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.2.1+cu121",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1712000308"
	},
	"total": 2518.126583485,
	"count": 1,
	"self": 0.4756415490001018,
	"children": {
	"run_training.setup": {
	"total": 0.049040627000067616,
	"count": 1,
	"self": 0.049040627000067616
	},
	"TrainerController.start_learning": {
	"total": 2517.601901309,
	"count": 1,
	"self": 1.4609522070804815,
	"children": {
	"TrainerController._reset_env": {
	"total": 2.0384117109997533,
	"count": 1,
	"self": 2.0384117109997533
	},
	"TrainerController.advance": {
	"total": 2514.013688609919,
	"count": 65417,
	"self": 1.502925605067503,
	"children": {
	"env_step": {
	"total": 1874.6336485859447,
	"count": 65417,
	"self": 1740.1902416718713,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 133.55975684108216,
	"count": 65417,
	"self": 4.7747069421711785,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 128.78504989891098,
	"count": 62560,
	"self": 128.78504989891098
	}
	}
	},
	"workers": {
	"total": 0.8836500729912586,
	"count": 65417,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2512.251911310238,
	"count": 65417,
	"is_parallel": true,
	"self": 898.011206602202,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0022879790003571543,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006465400010711164,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0016414389992860379,
	"count": 8,
	"is_parallel": true,
	"self": 0.0016414389992860379
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.05712476000007882,
	"count": 1,
	"is_parallel": true,
	"self": 0.0032920459989327355,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0004432969999470515,
	"count": 1,
	"is_parallel": true,
	"self": 0.0004432969999470515
	},
	"communicator.exchange": {
	"total": 0.05172769400087418,
	"count": 1,
	"is_parallel": true,
	"self": 0.05172769400087418
	},
	"steps_from_proto": {
	"total": 0.001661723000324855,
	"count": 1,
	"is_parallel": true,
	"self": 0.0003732569985004375,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0012884660018244176,
	"count": 8,
	"is_parallel": true,
	"self": 0.0012884660018244176
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1614.240704708036,
	"count": 65416,
	"is_parallel": true,
	"self": 34.801910062221395,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 24.99356799708312,
	"count": 65416,
	"is_parallel": true,
	"self": 24.99356799708312
	},
	"communicator.exchange": {
	"total": 1451.0625788657353,
	"count": 65416,
	"is_parallel": true,
	"self": 1451.0625788657353
	},
	"steps_from_proto": {
	"total": 103.38264778299617,
	"count": 65416,
	"is_parallel": true,
	"self": 21.307672516118146,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 82.07497526687803,
	"count": 523328,
	"is_parallel": true,
	"self": 82.07497526687803
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 637.8771144189068,
	"count": 65417,
	"self": 2.9310192950533747,
	"children": {
	"process_trajectory": {
	"total": 135.03107008984261,
	"count": 65417,
	"self": 134.81534168884173,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.21572840100088797,
	"count": 2,
	"self": 0.21572840100088797
	}
	}
	},
	"_update_policy": {
	"total": 499.9150250340108,
	"count": 472,
	"self": 294.54177497197907,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 205.37325006203173,
	"count": 22713,
	"self": 205.37325006203173
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 8.400002116104588e-07,
	"count": 1,
	"self": 8.400002116104588e-07
	},
	"TrainerController._save_models": {
	"total": 0.08884794100049476,
	"count": 1,
	"self": 0.0018642500008354546,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.0869836909996593,
	"count": 1,
	"self": 0.0869836909996593
	}
	}
	}
	}
	}
	}
	}