First Push

ac16b94 over 2 years ago

18.7 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.4401095509529114,
	"min": 0.42719903588294983,
	"max": 1.384224772453308,
	"count": 33
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 13175.119140625,
	"min": 12638.255859375,
	"max": 41991.84375,
	"count": 33
	},
	"Pyramids.Step.mean": {
	"value": 989888.0,
	"min": 29959.0,
	"max": 989888.0,
	"count": 33
	},
	"Pyramids.Step.sum": {
	"value": 989888.0,
	"min": 29959.0,
	"max": 989888.0,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.3571150004863739,
	"min": -0.09607616066932678,
	"max": 0.40010347962379456,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 95.70681762695312,
	"min": -22.866127014160156,
	"max": 106.82762908935547,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.027814822271466255,
	"min": -0.002628646558150649,
	"max": 0.3108713924884796,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 7.454372406005859,
	"min": -0.6939626932144165,
	"max": 73.98738861083984,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06379121950955043,
	"min": 0.06379121950955043,
	"max": 0.07260322353880232,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.8930770731337059,
	"min": 0.5761177049408275,
	"max": 1.0890483530820347,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.017464480543692065,
	"min": 0.0013920487489709995,
	"max": 0.017464480543692065,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.2445027276116889,
	"min": 0.016704584987651993,
	"max": 0.2445027276116889,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 7.436004664221429e-06,
	"min": 7.436004664221429e-06,
	"max": 0.00029501175166275,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.00010410406529910001,
	"min": 0.00010410406529910001,
	"max": 0.003492330135889999,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.1024786357142857,
	"min": 0.1024786357142857,
	"max": 0.19833725,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4347008999999997,
	"min": 1.4347008999999997,
	"max": 2.572383200000001,
	"count": 33
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.0002576157078571429,
	"min": 0.0002576157078571429,
	"max": 0.009833891275,
	"count": 33
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.0036066199100000004,
	"min": 0.0036066199100000004,
	"max": 0.11642458900000001,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.011781989596784115,
	"min": 0.011781989596784115,
	"max": 0.4199594259262085,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.16494785249233246,
	"min": 0.16494785249233246,
	"max": 3.359675407409668,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 434.71830985915494,
	"min": 431.64179104477614,
	"max": 980.1875,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 30865.0,
	"min": 16118.0,
	"max": 32598.0,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.4306833122132554,
	"min": -0.8568424754070513,
	"max": 1.4306833122132554,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 103.00919847935438,
	"min": -28.275801688432693,
	"max": 103.00919847935438,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.4306833122132554,
	"min": -0.8568424754070513,
	"max": 1.4306833122132554,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 103.00919847935438,
	"min": -28.275801688432693,
	"max": 103.00919847935438,
	"count": 33
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.05294481567964087,
	"min": 0.05294481567964087,
	"max": 8.271439988823499,
	"count": 33
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 3.8120267289341427,
	"min": 3.611602952965768,
	"max": 140.61447980999947,
	"count": 33
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1691854164",
	"python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1691856531"
	},
	"total": 2367.140538169,
	"count": 1,
	"self": 1.092234687000655,
	"children": {
	"run_training.setup": {
	"total": 0.04754448099993169,
	"count": 1,
	"self": 0.04754448099993169
	},
	"TrainerController.start_learning": {
	"total": 2366.0007590009996,
	"count": 1,
	"self": 1.4693136379933094,
	"children": {
	"TrainerController._reset_env": {
	"total": 4.11726319599984,
	"count": 1,
	"self": 4.11726319599984
	},
	"TrainerController.advance": {
	"total": 2360.2564457400067,
	"count": 63620,
	"self": 1.4253876988746015,
	"children": {
	"env_step": {
	"total": 1663.3963650271248,
	"count": 63620,
	"self": 1546.4751360310606,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 116.02991351905393,
	"count": 63620,
	"self": 4.973095398084752,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 111.05681812096918,
	"count": 62559,
	"self": 111.05681812096918
	}
	}
	},
	"workers": {
	"total": 0.8913154770102665,
	"count": 63620,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2360.4790948329883,
	"count": 63620,
	"is_parallel": true,
	"self": 934.3837678999507,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0016927819997363258,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005164719996173517,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0011763100001189741,
	"count": 8,
	"is_parallel": true,
	"self": 0.0011763100001189741
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.0460419420001017,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005636020005113096,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.00047328299979199073,
	"count": 1,
	"is_parallel": true,
	"self": 0.00047328299979199073
	},
	"communicator.exchange": {
	"total": 0.04304329399974449,
	"count": 1,
	"is_parallel": true,
	"self": 0.04304329399974449
	},
	"steps_from_proto": {
	"total": 0.0019617630000539066,
	"count": 1,
	"is_parallel": true,
	"self": 0.00042235900082232547,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0015394039992315811,
	"count": 8,
	"is_parallel": true,
	"self": 0.0015394039992315811
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1426.0953269330375,
	"count": 63619,
	"is_parallel": true,
	"self": 35.49173163098885,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 23.405742976981855,
	"count": 63619,
	"is_parallel": true,
	"self": 23.405742976981855
	},
	"communicator.exchange": {
	"total": 1257.3534896480783,
	"count": 63619,
	"is_parallel": true,
	"self": 1257.3534896480783
	},
	"steps_from_proto": {
	"total": 109.84436267698857,
	"count": 63619,
	"is_parallel": true,
	"self": 21.705387305205022,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 88.13897537178354,
	"count": 508952,
	"is_parallel": true,
	"self": 88.13897537178354
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 695.4346930140073,
	"count": 63620,
	"self": 2.904138178959329,
	"children": {
	"process_trajectory": {
	"total": 116.04861135804458,
	"count": 63620,
	"self": 115.79287874304464,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.2557326149999426,
	"count": 2,
	"self": 0.2557326149999426
	}
	}
	},
	"_update_policy": {
	"total": 576.4819434770034,
	"count": 457,
	"self": 373.6968971189767,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 202.78504635802665,
	"count": 22761,
	"self": 202.78504635802665
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.3489998309523799e-06,
	"count": 1,
	"self": 1.3489998309523799e-06
	},
	"TrainerController._save_models": {
	"total": 0.15773507799985964,
	"count": 1,
	"self": 0.0018806959997164086,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.15585438200014323,
	"count": 1,
	"self": 0.15585438200014323
	}
	}
	}
	}
	}
	}
	}