| { |
| "name": "root", |
| "gauges": { |
| "Pyramids.Policy.Entropy.mean": { |
| "value": 0.14759185910224915, |
| "min": 0.14025941491127014, |
| "max": 0.33215630054473877, |
| "count": 50 |
| }, |
| "Pyramids.Policy.Entropy.sum": { |
| "value": 4484.43115234375, |
| "min": 4207.7822265625, |
| "max": 10171.9541015625, |
| "count": 50 |
| }, |
| "Pyramids.Step.mean": { |
| "value": 2999999.0, |
| "min": 1529929.0, |
| "max": 2999999.0, |
| "count": 50 |
| }, |
| "Pyramids.Step.sum": { |
| "value": 2999999.0, |
| "min": 1529929.0, |
| "max": 2999999.0, |
| "count": 50 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
| "value": 0.7630169987678528, |
| "min": 0.5922383666038513, |
| "max": 0.7677894830703735, |
| "count": 50 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
| "value": 225.0900115966797, |
| "min": 165.23451232910156, |
| "max": 228.03347778320312, |
| "count": 50 |
| }, |
| "Pyramids.Policy.RndValueEstimate.mean": { |
| "value": 0.015491118654608727, |
| "min": 0.008117031306028366, |
| "max": 0.0288896132260561, |
| "count": 50 |
| }, |
| "Pyramids.Policy.RndValueEstimate.sum": { |
| "value": 4.56988000869751, |
| "min": 2.370173215866089, |
| "max": 8.233539581298828, |
| "count": 50 |
| }, |
| "Pyramids.Environment.EpisodeLength.mean": { |
| "value": 242.82203389830508, |
| "min": 222.50746268656715, |
| "max": 325.75, |
| "count": 50 |
| }, |
| "Pyramids.Environment.EpisodeLength.sum": { |
| "value": 28653.0, |
| "min": 26537.0, |
| "max": 31592.0, |
| "count": 50 |
| }, |
| "Pyramids.Environment.CumulativeReward.mean": { |
| "value": 1.7571779478151919, |
| "min": 1.586324718850915, |
| "max": 1.777492522637346, |
| "count": 50 |
| }, |
| "Pyramids.Environment.CumulativeReward.sum": { |
| "value": 207.34699784219265, |
| "min": 145.8119983226061, |
| "max": 238.18399803340435, |
| "count": 50 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.mean": { |
| "value": 1.7571779478151919, |
| "min": 1.586324718850915, |
| "max": 1.777492522637346, |
| "count": 50 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.sum": { |
| "value": 207.34699784219265, |
| "min": 145.8119983226061, |
| "max": 238.18399803340435, |
| "count": 50 |
| }, |
| "Pyramids.Policy.RndReward.mean": { |
| "value": 0.028435185211646504, |
| "min": 0.026604726313148128, |
| "max": 0.06942069130084362, |
| "count": 50 |
| }, |
| "Pyramids.Policy.RndReward.sum": { |
| "value": 3.3553518549742876, |
| "min": 3.3553518549742876, |
| "max": 6.733807056181831, |
| "count": 50 |
| }, |
| "Pyramids.Losses.PolicyLoss.mean": { |
| "value": 0.019560502592163784, |
| "min": 0.019560502592163784, |
| "max": 0.0276279745134525, |
| "count": 50 |
| }, |
| "Pyramids.Losses.PolicyLoss.sum": { |
| "value": 0.05868150777649135, |
| "min": 0.04262920394539833, |
| "max": 0.08060212047537789, |
| "count": 50 |
| }, |
| "Pyramids.Losses.ValueLoss.mean": { |
| "value": 0.01643072345604499, |
| "min": 0.014319621746738752, |
| "max": 0.017897415434320767, |
| "count": 50 |
| }, |
| "Pyramids.Losses.ValueLoss.sum": { |
| "value": 0.04929217036813498, |
| "min": 0.030501069389283656, |
| "max": 0.0536922463029623, |
| "count": 50 |
| }, |
| "Pyramids.Policy.LearningRate.mean": { |
| "value": 1.6612994462666625e-06, |
| "min": 1.6612994462666625e-06, |
| "max": 0.00014845130051624998, |
| "count": 50 |
| }, |
| "Pyramids.Policy.LearningRate.sum": { |
| "value": 4.983898338799987e-06, |
| "min": 4.983898338799987e-06, |
| "max": 0.0004376169541277333, |
| "count": 50 |
| }, |
| "Pyramids.Policy.Epsilon.mean": { |
| "value": 0.10055373333333334, |
| "min": 0.10055373333333334, |
| "max": 0.14948375000000003, |
| "count": 50 |
| }, |
| "Pyramids.Policy.Epsilon.sum": { |
| "value": 0.3016612, |
| "min": 0.2090047333333333, |
| "max": 0.4458722666666667, |
| "count": 50 |
| }, |
| "Pyramids.Policy.Beta.mean": { |
| "value": 6.531795999999988e-05, |
| "min": 6.531795999999988e-05, |
| "max": 0.004953426625, |
| "count": 50 |
| }, |
| "Pyramids.Policy.Beta.sum": { |
| "value": 0.0001959538799999996, |
| "min": 0.0001959538799999996, |
| "max": 0.014602639439999999, |
| "count": 50 |
| }, |
| "Pyramids.Losses.RNDLoss.mean": { |
| "value": 0.011611025780439377, |
| "min": 0.01159887108951807, |
| "max": 0.02117346040904522, |
| "count": 50 |
| }, |
| "Pyramids.Losses.RNDLoss.sum": { |
| "value": 0.03483307734131813, |
| "min": 0.02372013032436371, |
| "max": 0.06352037936449051, |
| "count": 50 |
| }, |
| "Pyramids.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 50 |
| }, |
| "Pyramids.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 50 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1746508706", |
| "python_version": "3.10.12 | packaged by conda-forge | (main, Jun 23 2023, 22:40:32) [GCC 12.3.0]", |
| "command_line_arguments": "/home/txshi/miniconda3/envs/hf-rl-ch5/bin/mlagents-learn ./ml-agents/config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics --resume", |
| "mlagents_version": "1.2.0.dev0", |
| "mlagents_envs_version": "1.2.0.dev0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "2.7.0+cu126", |
| "numpy_version": "1.23.5", |
| "end_time_seconds": "1746509653" |
| }, |
| "total": 946.4430587530005, |
| "count": 1, |
| "self": 0.1665285330018378, |
| "children": { |
| "run_training.setup": { |
| "total": 0.015372962998299045, |
| "count": 1, |
| "self": 0.015372962998299045 |
| }, |
| "TrainerController.start_learning": { |
| "total": 946.2611572570004, |
| "count": 1, |
| "self": 0.7353149860136909, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 1.3560721989997546, |
| "count": 1, |
| "self": 1.3560721989997546 |
| }, |
| "TrainerController.advance": { |
| "total": 944.1236960439855, |
| "count": 98280, |
| "self": 0.6919071292486478, |
| "children": { |
| "env_step": { |
| "total": 628.7653076611532, |
| "count": 98280, |
| "self": 501.679360544118, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 126.59082360999855, |
| "count": 98280, |
| "self": 2.55443194534746, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 124.03639166465109, |
| "count": 93817, |
| "self": 124.03639166465109 |
| } |
| } |
| }, |
| "workers": { |
| "total": 0.4951235070366238, |
| "count": 98280, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 945.3021435918654, |
| "count": 98280, |
| "is_parallel": true, |
| "self": 489.8738490467058, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.0006208550003066193, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0001753210017341189, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0004455339985725004, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0004455339985725004 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.012712784000541433, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.00012432600124157034, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.00013519099957193248, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.00013519099957193248 |
| }, |
| "communicator.exchange": { |
| "total": 0.012097856999389478, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.012097856999389478 |
| }, |
| "steps_from_proto": { |
| "total": 0.00035541000033845194, |
| "count": 1, |
| "is_parallel": true, |
| "self": 8.841799717629328e-05, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.00026699200316215865, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.00026699200316215865 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 455.4282945451596, |
| "count": 98279, |
| "is_parallel": true, |
| "self": 10.6707104262332, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 6.716008393870652, |
| "count": 98279, |
| "is_parallel": true, |
| "self": 6.716008393870652 |
| }, |
| "communicator.exchange": { |
| "total": 409.69189717502195, |
| "count": 98279, |
| "is_parallel": true, |
| "self": 409.69189717502195 |
| }, |
| "steps_from_proto": { |
| "total": 28.349678550033786, |
| "count": 98279, |
| "is_parallel": true, |
| "self": 6.308964319758161, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 22.040714230275626, |
| "count": 786232, |
| "is_parallel": true, |
| "self": 22.040714230275626 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 314.6664812535837, |
| "count": 98280, |
| "self": 1.5202239386580914, |
| "children": { |
| "process_trajectory": { |
| "total": 79.52096247990994, |
| "count": 98280, |
| "self": 79.37046390090836, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.15049857900157804, |
| "count": 3, |
| "self": 0.15049857900157804 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 233.62529483501567, |
| "count": 145, |
| "self": 185.6884477689655, |
| "children": { |
| "TorchPPOOptimizer.update": { |
| "total": 47.93684706605018, |
| "count": 7250, |
| "self": 47.93684706605018 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 4.420016921358183e-07, |
| "count": 1, |
| "self": 4.420016921358183e-07 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.04607358599969302, |
| "count": 1, |
| "self": 0.0011363630001142155, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.04493722299957881, |
| "count": 1, |
| "self": 0.04493722299957881 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |