First Push

3ea08aa verified 10 months ago

18.8 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.15558169782161713,
	"min": 0.1472327560186386,
	"max": 1.4351273775100708,
	"count": 100
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 4640.068359375,
	"min": 4440.5400390625,
	"max": 43536.0234375,
	"count": 100
	},
	"Pyramids.Step.mean": {
	"value": 2999890.0,
	"min": 29999.0,
	"max": 2999890.0,
	"count": 100
	},
	"Pyramids.Step.sum": {
	"value": 2999890.0,
	"min": 29999.0,
	"max": 2999890.0,
	"count": 100
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.765562117099762,
	"min": -0.10001370310783386,
	"max": 0.765562117099762,
	"count": 100
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 225.07525634765625,
	"min": -24.20331573486328,
	"max": 225.07525634765625,
	"count": 100
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.006237243302166462,
	"min": -0.008571779355406761,
	"max": 0.371082603931427,
	"count": 100
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 1.833749532699585,
	"min": -2.3058085441589355,
	"max": 88.31765747070312,
	"count": 100
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.07195211294608199,
	"min": 0.06418452211591,
	"max": 0.07522810055901144,
	"count": 100
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 1.007329581245148,
	"min": 0.4885829520223116,
	"max": 1.0727810624230187,
	"count": 100
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.014831242285863563,
	"min": 0.00025144599525025384,
	"max": 0.016989849534140726,
	"count": 100
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.2076373920020899,
	"min": 0.0032687979382533,
	"max": 0.2433097602430886,
	"count": 100
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 1.4847995050999992e-06,
	"min": 1.4847995050999992e-06,
	"max": 0.00029838354339596195,
	"count": 100
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 2.078719307139999e-05,
	"min": 2.078719307139999e-05,
	"max": 0.003969052576982499,
	"count": 100
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10049490000000001,
	"min": 0.10049490000000001,
	"max": 0.19946118095238097,
	"count": 100
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4069286,
	"min": 1.3962282666666668,
	"max": 2.723017500000001,
	"count": 100
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 5.944050999999997e-05,
	"min": 5.944050999999997e-05,
	"max": 0.009946171977142856,
	"count": 100
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.0008321671399999995,
	"min": 0.0008321671399999995,
	"max": 0.13230944825,
	"count": 100
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.0050049638375639915,
	"min": 0.004398328252136707,
	"max": 0.34621429443359375,
	"count": 100
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.07006949186325073,
	"min": 0.06157659366726875,
	"max": 2.4235000610351562,
	"count": 100
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 231.66153846153847,
	"min": 231.66153846153847,
	"max": 999.0,
	"count": 100
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 30116.0,
	"min": 16798.0,
	"max": 32780.0,
	"count": 100
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.7683384462044789,
	"min": -0.9999484395788562,
	"max": 1.7683384462044789,
	"count": 100
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 229.88399800658226,
	"min": -30.998401626944542,
	"max": 229.88399800658226,
	"count": 100
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.7683384462044789,
	"min": -0.9999484395788562,
	"max": 1.7683384462044789,
	"count": 100
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 229.88399800658226,
	"min": -30.998401626944542,
	"max": 229.88399800658226,
	"count": 100
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.01202009530702176,
	"min": 0.01202009530702176,
	"max": 6.632727971848319,
	"count": 100
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 1.5626123899128288,
	"min": 1.3960037025608472,
	"max": 112.75637552142143,
	"count": 100
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 100
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 100
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1750769260",
	"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "1.2.0.dev0",
	"mlagents_envs_version": "1.2.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.7.1+cu126",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1750776035"
	},
	"total": 6774.91293902,
	"count": 1,
	"self": 0.47630109199963044,
	"children": {
	"run_training.setup": {
	"total": 0.02976313499993921,
	"count": 1,
	"self": 0.02976313499993921
	},
	"TrainerController.start_learning": {
	"total": 6774.406874793,
	"count": 1,
	"self": 3.655272752934252,
	"children": {
	"TrainerController._reset_env": {
	"total": 2.263137302000132,
	"count": 1,
	"self": 2.263137302000132
	},
	"TrainerController.advance": {
	"total": 6768.399277221065,
	"count": 193521,
	"self": 3.9567093240020768,
	"children": {
	"env_step": {
	"total": 4840.817838260982,
	"count": 193521,
	"self": 4417.187091156227,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 421.40556460703215,
	"count": 193521,
	"self": 13.051874900156236,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 408.3536897068759,
	"count": 187548,
	"self": 408.3536897068759
	}
	}
	},
	"workers": {
	"total": 2.2251824977224715,
	"count": 193521,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 6760.150085565226,
	"count": 193521,
	"is_parallel": true,
	"self": 2663.5029470041827,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.001928769999949509,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006637619999310118,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0012650080000184971,
	"count": 8,
	"is_parallel": true,
	"self": 0.0012650080000184971
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.051287292999859346,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005711480000627489,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0005034250000335305,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005034250000335305
	},
	"communicator.exchange": {
	"total": 0.048467296999888276,
	"count": 1,
	"is_parallel": true,
	"self": 0.048467296999888276
	},
	"steps_from_proto": {
	"total": 0.0017454229998747905,
	"count": 1,
	"is_parallel": true,
	"self": 0.0003859129994907562,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0013595100003840344,
	"count": 8,
	"is_parallel": true,
	"self": 0.0013595100003840344
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 4096.647138561043,
	"count": 193520,
	"is_parallel": true,
	"self": 94.08022039295383,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 66.43535728009715,
	"count": 193520,
	"is_parallel": true,
	"self": 66.43535728009715
	},
	"communicator.exchange": {
	"total": 3657.4118404110645,
	"count": 193520,
	"is_parallel": true,
	"self": 3657.4118404110645
	},
	"steps_from_proto": {
	"total": 278.7197204769277,
	"count": 193520,
	"is_parallel": true,
	"self": 55.6945413097319,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 223.0251791671958,
	"count": 1548160,
	"is_parallel": true,
	"self": 223.0251791671958
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 1923.6247296360805,
	"count": 193521,
	"self": 7.528898271088792,
	"children": {
	"process_trajectory": {
	"total": 369.0966860849949,
	"count": 193521,
	"self": 368.57821221399627,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.518473870998605,
	"count": 6,
	"self": 0.518473870998605
	}
	}
	},
	"_update_policy": {
	"total": 1546.9991452799968,
	"count": 1395,
	"self": 851.702338796903,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 695.2968064830939,
	"count": 68367,
	"self": 695.2968064830939
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 8.53000528877601e-07,
	"count": 1,
	"self": 8.53000528877601e-07
	},
	"TrainerController._save_models": {
	"total": 0.0891866639994987,
	"count": 1,
	"self": 0.001364555999316508,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.0878221080001822,
	"count": 1,
	"self": 0.0878221080001822
	}
	}
	}
	}
	}
	}
	}