| { |
| "name": "root", |
| "gauges": { |
| "Pyramids.Policy.Entropy.mean": { |
| "value": 0.6534873843193054, |
| "min": 0.6534873843193054, |
| "max": 1.5431253910064697, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Entropy.sum": { |
| "value": 19531.431640625, |
| "min": 19531.431640625, |
| "max": 50713.2734375, |
| "count": 33 |
| }, |
| "Pyramids.Step.mean": { |
| "value": 989922.0, |
| "min": 29952.0, |
| "max": 989922.0, |
| "count": 33 |
| }, |
| "Pyramids.Step.sum": { |
| "value": 989922.0, |
| "min": 29952.0, |
| "max": 989922.0, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
| "value": 0.5039507150650024, |
| "min": -0.12338055670261383, |
| "max": 0.5929787755012512, |
| "count": 33 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
| "value": 138.08248901367188, |
| "min": -29.487953186035156, |
| "max": 163.66213989257812, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndValueEstimate.mean": { |
| "value": 0.03150377422571182, |
| "min": 0.00490775378420949, |
| "max": 0.4278498888015747, |
| "count": 33 |
| }, |
| "Pyramids.Policy.RndValueEstimate.sum": { |
| "value": 8.632034301757812, |
| "min": 1.2969324588775635, |
| "max": 100.11687469482422, |
| "count": 33 |
| }, |
| "Pyramids.Losses.PolicyLoss.mean": { |
| "value": 0.06848002173091645, |
| "min": 0.06330861079775439, |
| "max": 0.07399730283015296, |
| "count": 33 |
| }, |
| "Pyramids.Losses.PolicyLoss.sum": { |
| "value": 0.9587203042328304, |
| "min": 0.4844167022529291, |
| "max": 1.0347373552549648, |
| "count": 33 |
| }, |
| "Pyramids.Losses.ValueLoss.mean": { |
| "value": 0.016658629933530296, |
| "min": 0.0010643052913413462, |
| "max": 0.016658629933530296, |
| "count": 33 |
| }, |
| "Pyramids.Losses.ValueLoss.sum": { |
| "value": 0.23322081906942416, |
| "min": 0.007450137039389423, |
| "max": 0.23322081906942416, |
| "count": 33 |
| }, |
| "Pyramids.Policy.LearningRate.mean": { |
| "value": 7.547733198407141e-06, |
| "min": 7.547733198407141e-06, |
| "max": 0.0002950848016384, |
| "count": 33 |
| }, |
| "Pyramids.Policy.LearningRate.sum": { |
| "value": 0.00010566826477769997, |
| "min": 0.00010566826477769997, |
| "max": 0.0027920981693007004, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Epsilon.mean": { |
| "value": 0.10251587857142859, |
| "min": 0.10251587857142859, |
| "max": 0.19836159999999997, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Epsilon.sum": { |
| "value": 1.4352223000000002, |
| "min": 1.3684608000000003, |
| "max": 2.2755587, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Beta.mean": { |
| "value": 0.0002613362692857142, |
| "min": 0.0002613362692857142, |
| "max": 0.00983632384, |
| "count": 33 |
| }, |
| "Pyramids.Policy.Beta.sum": { |
| "value": 0.003658707769999999, |
| "min": 0.003658707769999999, |
| "max": 0.09309686007000001, |
| "count": 33 |
| }, |
| "Pyramids.Losses.RNDLoss.mean": { |
| "value": 0.013311014510691166, |
| "min": 0.013190694153308868, |
| "max": 0.4133564829826355, |
| "count": 33 |
| }, |
| "Pyramids.Losses.RNDLoss.sum": { |
| "value": 0.18635420501232147, |
| "min": 0.18466971814632416, |
| "max": 2.8934953212738037, |
| "count": 33 |
| }, |
| "Pyramids.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 33 |
| }, |
| "Pyramids.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 33 |
| }, |
| "Pyramids.Environment.EpisodeLength.mean": { |
| "value": 323.0978260869565, |
| "min": 323.0978260869565, |
| "max": 999.0, |
| "count": 32 |
| }, |
| "Pyramids.Environment.EpisodeLength.sum": { |
| "value": 29725.0, |
| "min": 1685.0, |
| "max": 62214.0, |
| "count": 32 |
| }, |
| "Pyramids.Environment.CumulativeReward.mean": { |
| "value": 1.654105468601971, |
| "min": -1.0000000521540642, |
| "max": 1.6611124759539961, |
| "count": 32 |
| }, |
| "Pyramids.Environment.CumulativeReward.sum": { |
| "value": 150.52359764277935, |
| "min": -58.27420325577259, |
| "max": 150.52359764277935, |
| "count": 32 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.mean": { |
| "value": 1.654105468601971, |
| "min": -1.0000000521540642, |
| "max": 1.6611124759539961, |
| "count": 32 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.sum": { |
| "value": 150.52359764277935, |
| "min": -58.27420325577259, |
| "max": 150.52359764277935, |
| "count": 32 |
| }, |
| "Pyramids.Policy.RndReward.mean": { |
| "value": 0.04542399158142891, |
| "min": 0.04542399158142891, |
| "max": 4.694267954826355, |
| "count": 32 |
| }, |
| "Pyramids.Policy.RndReward.sum": { |
| "value": 4.133583233910031, |
| "min": 1.8478424977511168, |
| "max": 117.35669887065887, |
| "count": 32 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1682276088", |
| "python_version": "3.9.16 | packaged by conda-forge | (main, Feb 1 2023, 21:39:03) \n[GCC 11.3.0]", |
| "command_line_arguments": "/home/byron/miniconda3/envs/torch/bin/mlagents-learn ./ml-agents/config/ppo/PyramidsRND.yaml --env=./ml-agents/training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training2 --no-graphics --torch-device=cuda:0 --num-envs 4 --num-areas 8", |
| "mlagents_version": "0.31.0.dev0", |
| "mlagents_envs_version": "0.31.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "1.13.1+cu117", |
| "numpy_version": "1.21.2", |
| "end_time_seconds": "1682277165" |
| }, |
| "total": 1076.351261099, |
| "count": 1, |
| "self": 0.4212915969983442, |
| "children": { |
| "run_training.setup": { |
| "total": 0.023083496998879127, |
| "count": 1, |
| "self": 0.023083496998879127 |
| }, |
| "TrainerController.start_learning": { |
| "total": 1075.906886005003, |
| "count": 1, |
| "self": 1.1175611507642316, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 12.854328707995592, |
| "count": 1, |
| "self": 12.854328707995592 |
| }, |
| "TrainerController.advance": { |
| "total": 1061.8692720722465, |
| "count": 50711, |
| "self": 1.0072531040204922, |
| "children": { |
| "env_step": { |
| "total": 308.1554301210999, |
| "count": 50711, |
| "self": 127.75338604554418, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 179.70773294112587, |
| "count": 63944, |
| "self": 3.6913824499060865, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 176.01635049121978, |
| "count": 62735, |
| "self": 176.01635049121978 |
| } |
| } |
| }, |
| "workers": { |
| "total": 0.6943111344298813, |
| "count": 50711, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 4300.106483937736, |
| "count": 63941, |
| "is_parallel": true, |
| "self": 3397.442163723812, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.004771393985720351, |
| "count": 4, |
| "is_parallel": true, |
| "self": 0.00135901098838076, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0034123829973395914, |
| "count": 32, |
| "is_parallel": true, |
| "self": 0.0034123829973395914 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.12181193399010226, |
| "count": 4, |
| "is_parallel": true, |
| "self": 0.000998283998342231, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.0016725879977457225, |
| "count": 4, |
| "is_parallel": true, |
| "self": 0.0016725879977457225 |
| }, |
| "communicator.exchange": { |
| "total": 0.11608262499794364, |
| "count": 4, |
| "is_parallel": true, |
| "self": 0.11608262499794364 |
| }, |
| "steps_from_proto": { |
| "total": 0.003058436996070668, |
| "count": 4, |
| "is_parallel": true, |
| "self": 0.0007625639991601929, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.002295872996910475, |
| "count": 32, |
| "is_parallel": true, |
| "self": 0.002295872996910475 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 902.6643202139239, |
| "count": 63937, |
| "is_parallel": true, |
| "self": 16.631254727501073, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 12.274879490956664, |
| "count": 63937, |
| "is_parallel": true, |
| "self": 12.274879490956664 |
| }, |
| "communicator.exchange": { |
| "total": 828.0996875454002, |
| "count": 63937, |
| "is_parallel": true, |
| "self": 828.0996875454002 |
| }, |
| "steps_from_proto": { |
| "total": 45.65849845006596, |
| "count": 63937, |
| "is_parallel": true, |
| "self": 11.43318056021235, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 34.22531788985361, |
| "count": 511496, |
| "is_parallel": true, |
| "self": 34.22531788985361 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 752.7065888471261, |
| "count": 50711, |
| "self": 2.05000208268757, |
| "children": { |
| "process_trajectory": { |
| "total": 120.992824682442, |
| "count": 50711, |
| "self": 120.85008095644298, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.14274372599902563, |
| "count": 2, |
| "self": 0.14274372599902563 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 629.6637620819965, |
| "count": 420, |
| "self": 310.2301196816261, |
| "children": { |
| "TorchPPOOptimizer.update": { |
| "total": 319.43364240037045, |
| "count": 22926, |
| "self": 319.43364240037045 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 6.999907782301307e-07, |
| "count": 1, |
| "self": 6.999907782301307e-07 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.06572337400575634, |
| "count": 1, |
| "self": 0.0007505450048483908, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.06497282900090795, |
| "count": 1, |
| "self": 0.06497282900090795 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |