| { |
| "name": "root", |
| "gauges": { |
| "Pyramids.Policy.Entropy.mean": { |
| "value": 0.432526558637619, |
| "min": 0.32225361466407776, |
| "max": 1.5993752479553223, |
| "count": 150 |
| }, |
| "Pyramids.Policy.Entropy.sum": { |
| "value": 4401.39013671875, |
| "min": 3195.638916015625, |
| "max": 16377.6025390625, |
| "count": 150 |
| }, |
| "Pyramids.Step.mean": { |
| "value": 1499903.0, |
| "min": 9984.0, |
| "max": 1499903.0, |
| "count": 150 |
| }, |
| "Pyramids.Step.sum": { |
| "value": 1499903.0, |
| "min": 9984.0, |
| "max": 1499903.0, |
| "count": 150 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { |
| "value": 0.04954734072089195, |
| "min": -0.10484987497329712, |
| "max": 0.18645791709423065, |
| "count": 150 |
| }, |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { |
| "value": 4.062881946563721, |
| "min": -8.283140182495117, |
| "max": 15.66246509552002, |
| "count": 150 |
| }, |
| "Pyramids.Policy.CuriosityValueEstimate.mean": { |
| "value": 0.11475102603435516, |
| "min": 0.08723638951778412, |
| "max": 0.5798850059509277, |
| "count": 150 |
| }, |
| "Pyramids.Policy.CuriosityValueEstimate.sum": { |
| "value": 9.409584045410156, |
| "min": 7.153383731842041, |
| "max": 46.97068405151367, |
| "count": 150 |
| }, |
| "Pyramids.Losses.PolicyLoss.mean": { |
| "value": 0.06473862011140832, |
| "min": 0.05774385195642632, |
| "max": 0.07875350401352715, |
| "count": 150 |
| }, |
| "Pyramids.Losses.PolicyLoss.sum": { |
| "value": 0.2589544804456333, |
| "min": 0.13296349911252037, |
| "max": 0.38936668815657355, |
| "count": 150 |
| }, |
| "Pyramids.Losses.ValueLoss.mean": { |
| "value": 0.0037324324090756518, |
| "min": 7.420701751145458e-05, |
| "max": 0.009053264769439314, |
| "count": 150 |
| }, |
| "Pyramids.Losses.ValueLoss.sum": { |
| "value": 0.014929729636302607, |
| "min": 0.00029682807004581833, |
| "max": 0.03491397371423469, |
| "count": 150 |
| }, |
| "Pyramids.Policy.LearningRate.mean": { |
| "value": 1.0306996564666704e-06, |
| "min": 1.0306996564666704e-06, |
| "max": 0.00029877120040959997, |
| "count": 150 |
| }, |
| "Pyramids.Policy.LearningRate.sum": { |
| "value": 4.122798625866682e-06, |
| "min": 4.122798625866682e-06, |
| "max": 0.0013251332582889333, |
| "count": 150 |
| }, |
| "Pyramids.Policy.Epsilon.mean": { |
| "value": 0.10034353333333335, |
| "min": 0.10034353333333335, |
| "max": 0.1995904, |
| "count": 150 |
| }, |
| "Pyramids.Policy.Epsilon.sum": { |
| "value": 0.4013741333333334, |
| "min": 0.3847936, |
| "max": 0.9417110666666667, |
| "count": 150 |
| }, |
| "Pyramids.Policy.Beta.mean": { |
| "value": 4.431898000000013e-05, |
| "min": 4.431898000000013e-05, |
| "max": 0.009959080959999998, |
| "count": 150 |
| }, |
| "Pyramids.Policy.Beta.sum": { |
| "value": 0.0001772759200000005, |
| "min": 0.0001772759200000005, |
| "max": 0.044176935560000005, |
| "count": 150 |
| }, |
| "Pyramids.Losses.CuriosityForwardLoss.mean": { |
| "value": 0.061895945167634636, |
| "min": 0.06048533997188012, |
| "max": 0.9530652779309701, |
| "count": 150 |
| }, |
| "Pyramids.Losses.CuriosityForwardLoss.sum": { |
| "value": 0.24758378067053854, |
| "min": 0.24758378067053854, |
| "max": 1.9061305558619401, |
| "count": 150 |
| }, |
| "Pyramids.Losses.CuriosityInverseLoss.mean": { |
| "value": 0.06055828338685387, |
| "min": 0.04053960538779696, |
| "max": 0.9808244205390414, |
| "count": 150 |
| }, |
| "Pyramids.Losses.CuriosityInverseLoss.sum": { |
| "value": 0.2422331335474155, |
| "min": 0.16215842155118784, |
| "max": 1.9616488410780828, |
| "count": 150 |
| }, |
| "Pyramids.IsTraining.mean": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 150 |
| }, |
| "Pyramids.IsTraining.sum": { |
| "value": 1.0, |
| "min": 1.0, |
| "max": 1.0, |
| "count": 150 |
| }, |
| "Pyramids.Environment.EpisodeLength.mean": { |
| "value": 628.2727272727273, |
| "min": 364.0, |
| "max": 999.0, |
| "count": 145 |
| }, |
| "Pyramids.Environment.EpisodeLength.sum": { |
| "value": 6911.0, |
| "min": 364.0, |
| "max": 15984.0, |
| "count": 145 |
| }, |
| "Pyramids.Environment.CumulativeReward.mean": { |
| "value": 0.8261090652509169, |
| "min": -1.0000000521540642, |
| "max": 1.6359999477863312, |
| "count": 146 |
| }, |
| "Pyramids.Environment.CumulativeReward.sum": { |
| "value": 9.087199717760086, |
| "min": -16.000000834465027, |
| "max": 9.087199717760086, |
| "count": 146 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.mean": { |
| "value": 0.8261090652509169, |
| "min": -1.0000000521540642, |
| "max": 1.6359999477863312, |
| "count": 146 |
| }, |
| "Pyramids.Policy.ExtrinsicReward.sum": { |
| "value": 9.087199717760086, |
| "min": -16.000000834465027, |
| "max": 9.087199717760086, |
| "count": 146 |
| }, |
| "Pyramids.Policy.CuriosityReward.mean": { |
| "value": 0.8066543743691661, |
| "min": 0.8066543743691661, |
| "max": 7.507157441228628, |
| "count": 146 |
| }, |
| "Pyramids.Policy.CuriosityReward.sum": { |
| "value": 8.873198118060827, |
| "min": 1.2870761454105377, |
| "max": 120.11451905965805, |
| "count": 146 |
| } |
| }, |
| "metadata": { |
| "timer_format_version": "0.1.0", |
| "start_time_seconds": "1771968355", |
| "python_version": "3.10.12 (main, Jan 26 2026, 14:55:28) [GCC 11.4.0]", |
| "command_line_arguments": "/kaggle/working/mlagents-env/bin/mlagents-learn /kaggle/working/ml-agents/config/ppo/Pyramids.yaml --env=./training-envs-executables/Pyramids/Pyramids/Pyramids --run-id=Pyramids1 --no-graphics --force", |
| "mlagents_version": "1.1.0", |
| "mlagents_envs_version": "1.1.0", |
| "communication_protocol_version": "1.5.0", |
| "pytorch_version": "2.0.1+cpu", |
| "numpy_version": "1.23.5", |
| "end_time_seconds": "1771971846" |
| }, |
| "total": 3490.8813013159997, |
| "count": 1, |
| "self": 0.3800962890009032, |
| "children": { |
| "run_training.setup": { |
| "total": 0.016093584999907762, |
| "count": 1, |
| "self": 0.016093584999907762 |
| }, |
| "TrainerController.start_learning": { |
| "total": 3490.485111441999, |
| "count": 1, |
| "self": 1.8422932399635101, |
| "children": { |
| "TrainerController._reset_env": { |
| "total": 0.8198842850006258, |
| "count": 1, |
| "self": 0.8198842850006258 |
| }, |
| "TrainerController.advance": { |
| "total": 3487.768661795034, |
| "count": 94781, |
| "self": 1.8979434687980756, |
| "children": { |
| "env_step": { |
| "total": 2328.233717913111, |
| "count": 94781, |
| "self": 2197.3696197046556, |
| "children": { |
| "SubprocessEnvManager._take_step": { |
| "total": 129.72657525722298, |
| "count": 94781, |
| "self": 7.196937510988391, |
| "children": { |
| "TorchPolicy.evaluate": { |
| "total": 122.52963774623458, |
| "count": 93819, |
| "self": 122.52963774623458 |
| } |
| } |
| }, |
| "workers": { |
| "total": 1.137522951232313, |
| "count": 94781, |
| "self": 0.0, |
| "children": { |
| "worker_root": { |
| "total": 3487.0163712979956, |
| "count": 94781, |
| "is_parallel": true, |
| "self": 1445.7082351739773, |
| "children": { |
| "run_training.setup": { |
| "total": 0.0, |
| "count": 0, |
| "is_parallel": true, |
| "self": 0.0, |
| "children": { |
| "steps_from_proto": { |
| "total": 0.0022598160003326484, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0007911549992059008, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.0014686610011267476, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.0014686610011267476 |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 0.04300834900004702, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0003477970003586961, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 0.0003681289999803994, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.0003681289999803994 |
| }, |
| "communicator.exchange": { |
| "total": 0.04089825099981681, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.04089825099981681 |
| }, |
| "steps_from_proto": { |
| "total": 0.001394171999891114, |
| "count": 1, |
| "is_parallel": true, |
| "self": 0.00042417899931024294, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 0.000969993000580871, |
| "count": 8, |
| "is_parallel": true, |
| "self": 0.000969993000580871 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "UnityEnvironment.step": { |
| "total": 2041.3081361240183, |
| "count": 94780, |
| "is_parallel": true, |
| "self": 39.858876127959775, |
| "children": { |
| "UnityEnvironment._generate_step_input": { |
| "total": 29.71144846707284, |
| "count": 94780, |
| "is_parallel": true, |
| "self": 29.71144846707284 |
| }, |
| "communicator.exchange": { |
| "total": 1845.155440685765, |
| "count": 94780, |
| "is_parallel": true, |
| "self": 1845.155440685765 |
| }, |
| "steps_from_proto": { |
| "total": 126.58237084322082, |
| "count": 94780, |
| "is_parallel": true, |
| "self": 26.328388871829702, |
| "children": { |
| "_process_rank_one_or_two_observation": { |
| "total": 100.25398197139111, |
| "count": 758240, |
| "is_parallel": true, |
| "self": 100.25398197139111 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_advance": { |
| "total": 1157.637000413125, |
| "count": 94781, |
| "self": 3.5209788969887086, |
| "children": { |
| "process_trajectory": { |
| "total": 164.55201621413744, |
| "count": 94781, |
| "self": 164.14582424913533, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.4061919650021082, |
| "count": 7, |
| "self": 0.4061919650021082 |
| } |
| } |
| }, |
| "_update_policy": { |
| "total": 989.5640053019988, |
| "count": 662, |
| "self": 713.7821614979439, |
| "children": { |
| "TorchPPOOptimizer.update": { |
| "total": 275.7818438040549, |
| "count": 34125, |
| "self": 275.7818438040549 |
| } |
| } |
| } |
| } |
| } |
| } |
| }, |
| "trainer_threads": { |
| "total": 1.0059993655886501e-06, |
| "count": 1, |
| "self": 1.0059993655886501e-06 |
| }, |
| "TrainerController._save_models": { |
| "total": 0.054271116001473274, |
| "count": 1, |
| "self": 0.000733008000679547, |
| "children": { |
| "RLTrainer._checkpoint": { |
| "total": 0.05353810800079373, |
| "count": 1, |
| "self": 0.05353810800079373 |
| } |
| } |
| } |
| } |
| } |
| } |
| } |