version one

480b651 verified about 1 year ago

18.7 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.6612257361412048,
	"min": 0.6612257361412048,
	"max": 1.3829609155654907,
	"count": 33
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 19678.078125,
	"min": 19678.078125,
	"max": 41953.50390625,
	"count": 33
	},
	"Pyramids.Step.mean": {
	"value": 989883.0,
	"min": 29952.0,
	"max": 989883.0,
	"count": 33
	},
	"Pyramids.Step.sum": {
	"value": 989883.0,
	"min": 29952.0,
	"max": 989883.0,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.0627322718501091,
	"min": -0.11199305951595306,
	"max": 0.09172578901052475,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 15.432138442993164,
	"min": -27.102319717407227,
	"max": 22.656269073486328,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.02176976017653942,
	"min": 0.007074796594679356,
	"max": 0.35083121061325073,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 5.355360984802246,
	"min": 1.7474747896194458,
	"max": 84.19949340820312,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06850646806835832,
	"min": 0.06398289415049703,
	"max": 0.07310759250863705,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9590905529570164,
	"min": 0.4798651467052846,
	"max": 1.0437771753045928,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.005933725971596435,
	"min": 0.0002992366546125215,
	"max": 0.005982384877318827,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.08307216360235009,
	"min": 0.002992366546125215,
	"max": 0.08307216360235009,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 7.464118940564287e-06,
	"min": 7.464118940564287e-06,
	"max": 0.00029515063018788575,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.00010449766516790002,
	"min": 0.00010449766516790002,
	"max": 0.0030207608930798,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10248800714285713,
	"min": 0.10248800714285713,
	"max": 0.19838354285714285,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4348321,
	"min": 1.3691136000000002,
	"max": 2.359057,
	"count": 33
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.0002585519135714287,
	"min": 0.0002585519135714287,
	"max": 0.00983851593142857,
	"count": 33
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.003619726790000002,
	"min": 0.003619726790000002,
	"max": 0.10072132798,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.014452091418206692,
	"min": 0.014279200695455074,
	"max": 0.42627301812171936,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.20232927799224854,
	"min": 0.20070239901542664,
	"max": 2.9839110374450684,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 805.4,
	"min": 795.5263157894736,
	"max": 999.0,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 28189.0,
	"min": 15984.0,
	"max": 32406.0,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 0.28002281444413324,
	"min": -1.0000000521540642,
	"max": 0.28002281444413324,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 9.800798505544662,
	"min": -32.000001668930054,
	"max": 9.800798505544662,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 0.28002281444413324,
	"min": -1.0000000521540642,
	"max": 0.28002281444413324,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 9.800798505544662,
	"min": -32.000001668930054,
	"max": 9.800798505544662,
	"count": 33
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.12133785032866788,
	"min": 0.11832984130925094,
	"max": 8.416626082733274,
	"count": 33
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 4.246824761503376,
	"min": 4.213088566903025,
	"max": 134.66601732373238,
	"count": 33
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1742555351",
	"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "1.2.0.dev0",
	"mlagents_envs_version": "1.2.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.6.0+cu124",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1742557830"
	},
	"total": 2479.1611598629997,
	"count": 1,
	"self": 0.5758834610001031,
	"children": {
	"run_training.setup": {
	"total": 0.034341406999828905,
	"count": 1,
	"self": 0.034341406999828905
	},
	"TrainerController.start_learning": {
	"total": 2478.550934995,
	"count": 1,
	"self": 2.433458263002649,
	"children": {
	"TrainerController._reset_env": {
	"total": 2.978400418000092,
	"count": 1,
	"self": 2.978400418000092
	},
	"TrainerController.advance": {
	"total": 2473.0697424669975,
	"count": 63162,
	"self": 2.4555728870204803,
	"children": {
	"env_step": {
	"total": 1645.1093814070057,
	"count": 63162,
	"self": 1487.5745012469147,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 156.12895080501517,
	"count": 63162,
	"self": 6.11167329604973,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 150.01727750896544,
	"count": 62546,
	"self": 150.01727750896544
	}
	}
	},
	"workers": {
	"total": 1.4059293550758412,
	"count": 63162,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2471.5795739230416,
	"count": 63162,
	"is_parallel": true,
	"self": 1141.1593669769836,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.004115429999956177,
	"count": 1,
	"is_parallel": true,
	"self": 0.0016213500002777437,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0024940799996784335,
	"count": 8,
	"is_parallel": true,
	"self": 0.0024940799996784335
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.07220375299993975,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005890499996894505,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.000539300000127696,
	"count": 1,
	"is_parallel": true,
	"self": 0.000539300000127696
	},
	"communicator.exchange": {
	"total": 0.06930812300015532,
	"count": 1,
	"is_parallel": true,
	"self": 0.06930812300015532
	},
	"steps_from_proto": {
	"total": 0.0017672799999672861,
	"count": 1,
	"is_parallel": true,
	"self": 0.0003825600001619023,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0013847199998053838,
	"count": 8,
	"is_parallel": true,
	"self": 0.0013847199998053838
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1330.420206946058,
	"count": 63161,
	"is_parallel": true,
	"self": 38.685660551049295,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 27.595473760981577,
	"count": 63161,
	"is_parallel": true,
	"self": 27.595473760981577
	},
	"communicator.exchange": {
	"total": 1162.6839711710654,
	"count": 63161,
	"is_parallel": true,
	"self": 1162.6839711710654
	},
	"steps_from_proto": {
	"total": 101.4551014629617,
	"count": 63161,
	"is_parallel": true,
	"self": 23.00321879287071,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 78.45188267009098,
	"count": 505288,
	"is_parallel": true,
	"self": 78.45188267009098
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 825.5047881729715,
	"count": 63162,
	"self": 4.589303499991047,
	"children": {
	"process_trajectory": {
	"total": 138.26821690098018,
	"count": 63162,
	"self": 137.73092742998028,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.5372894709998945,
	"count": 2,
	"self": 0.5372894709998945
	}
	}
	},
	"_update_policy": {
	"total": 682.6472677720003,
	"count": 433,
	"self": 264.3730516609744,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 418.2742161110259,
	"count": 22863,
	"self": 418.2742161110259
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.4299998838396277e-06,
	"count": 1,
	"self": 1.4299998838396277e-06
	},
	"TrainerController._save_models": {
	"total": 0.06933241699971404,
	"count": 1,
	"self": 0.0014144899996608729,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.06791792700005317,
	"count": 1,
	"self": 0.06791792700005317
	}
	}
	}
	}
	}
	}
	}