{ "name": "root", "gauges": { "Pyramids.Policy.Entropy.mean": { "value": 0.49476349353790283, "min": 0.4852714538574219, "max": 1.4339741468429565, "count": 26 }, "Pyramids.Policy.Entropy.sum": { "value": 14977.48046875, "min": 14538.595703125, "max": 43501.0390625, "count": 26 }, "Pyramids.Step.mean": { "value": 779914.0, "min": 29952.0, "max": 779914.0, "count": 26 }, "Pyramids.Step.sum": { "value": 779914.0, "min": 29952.0, "max": 779914.0, "count": 26 }, "Pyramids.Policy.ExtrinsicValueEstimate.mean": { "value": 0.3168967366218567, "min": -0.12174516171216965, "max": 0.3173356056213379, "count": 26 }, "Pyramids.Policy.ExtrinsicValueEstimate.sum": { "value": 83.66073608398438, "min": -28.85360336303711, "max": 83.66073608398438, "count": 26 }, "Pyramids.Policy.RndValueEstimate.mean": { "value": 0.0046995291486382484, "min": 0.0033017457462847233, "max": 0.4047175347805023, "count": 26 }, "Pyramids.Policy.RndValueEstimate.sum": { "value": 1.240675687789917, "min": 0.8155311942100525, "max": 95.91805267333984, "count": 26 }, "Pyramids.Losses.PolicyLoss.mean": { "value": 0.06966448413108342, "min": 0.06553156230515046, "max": 0.07370801784734896, "count": 26 }, "Pyramids.Losses.PolicyLoss.sum": { "value": 0.9753027778351679, "min": 0.4833440314229021, "max": 1.0600366913268398, "count": 26 }, "Pyramids.Losses.ValueLoss.mean": { "value": 0.018042720152672182, "min": 3.756502231914526e-05, "max": 0.018042720152672182, "count": 26 }, "Pyramids.Losses.ValueLoss.sum": { "value": 0.25259808213741053, "min": 0.0004883452901488884, "max": 0.25259808213741053, "count": 26 }, "Pyramids.Policy.LearningRate.mean": { "value": 1.2960176037116072e-05, "min": 1.2960176037116072e-05, "max": 0.00029393828773485714, "count": 26 }, "Pyramids.Policy.LearningRate.sum": { "value": 0.000181442464519625, "min": 0.000181442464519625, "max": 0.0033915905444698753, "count": 26 }, "Pyramids.Policy.Epsilon.mean": { "value": 0.1043200267857143, "min": 0.1043200267857143, "max": 0.19797942857142856, "count": 26 }, "Pyramids.Policy.Epsilon.sum": { "value": 1.4604803750000002, "min": 1.3613920000000002, "max": 2.51128725, "count": 26 }, "Pyramids.Policy.Beta.mean": { "value": 0.0004415706758928571, "min": 0.0004415706758928571, "max": 0.009798144914285713, "count": 26 }, "Pyramids.Policy.Beta.sum": { "value": 0.0061819894625, "min": 0.0061819894625, "max": 0.11306995948750001, "count": 26 }, "Pyramids.Losses.RNDLoss.mean": { "value": 0.013691753149032593, "min": 0.013691753149032593, "max": 0.46661216020584106, "count": 26 }, "Pyramids.Losses.RNDLoss.sum": { "value": 0.1916845440864563, "min": 0.1916845440864563, "max": 3.2662851810455322, "count": 26 }, "Pyramids.Environment.EpisodeLength.mean": { "value": 477.4788732394366, "min": 477.4788732394366, "max": 999.0, "count": 26 }, "Pyramids.Environment.EpisodeLength.sum": { "value": 33901.0, "min": 15984.0, "max": 33901.0, "count": 26 }, "Pyramids.Environment.CumulativeReward.mean": { "value": 1.2971041938158827, "min": -1.0000000521540642, "max": 1.2971041938158827, "count": 26 }, "Pyramids.Environment.CumulativeReward.sum": { "value": 92.09439776092768, "min": -32.000001668930054, "max": 92.09439776092768, "count": 26 }, "Pyramids.Policy.ExtrinsicReward.mean": { "value": 1.2971041938158827, "min": -1.0000000521540642, "max": 1.2971041938158827, "count": 26 }, "Pyramids.Policy.ExtrinsicReward.sum": { "value": 92.09439776092768, "min": -32.000001668930054, "max": 92.09439776092768, "count": 26 }, "Pyramids.Policy.RndReward.mean": { "value": 0.06791334474991358, "min": 0.06791334474991358, "max": 9.313939461484551, "count": 26 }, "Pyramids.Policy.RndReward.sum": { "value": 4.821847477243864, "min": 3.9129698085598648, "max": 149.02303138375282, "count": 26 }, "Pyramids.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 26 }, "Pyramids.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 26 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1673412704", "python_version": "3.8.16 (default, Dec 7 2022, 01:12:13) \n[GCC 7.5.0]", "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics --force", "mlagents_version": "0.29.0.dev0", "mlagents_envs_version": "0.29.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.8.1+cu102", "numpy_version": "1.21.6", "end_time_seconds": "1673414420" }, "total": 1715.4272575219998, "count": 1, "self": 0.44289045599998644, "children": { "run_training.setup": { "total": 0.11044421999986298, "count": 1, "self": 0.11044421999986298 }, "TrainerController.start_learning": { "total": 1714.873922846, "count": 1, "self": 1.1755026050377637, "children": { "TrainerController._reset_env": { "total": 6.708610992000104, "count": 1, "self": 6.708610992000104 }, "TrainerController.advance": { "total": 1706.6131214679617, "count": 50714, "self": 1.1257404760258396, "children": { "env_step": { "total": 1106.7132887349285, "count": 50714, "self": 1013.182600981931, "children": { "SubprocessEnvManager._take_step": { "total": 92.84420582597568, "count": 50714, "self": 3.719329618028951, "children": { "TorchPolicy.evaluate": { "total": 89.12487620794673, "count": 50036, "self": 28.34038994091543, "children": { "TorchPolicy.sample_actions": { "total": 60.7844862670313, "count": 50036, "self": 60.7844862670313 } } } } }, "workers": { "total": 0.6864819270217595, "count": 50714, "self": 0.0, "children": { "worker_root": { "total": 1710.8475445879963, "count": 50714, "is_parallel": true, "self": 781.9695121539357, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.0019001539999408124, "count": 1, "is_parallel": true, "self": 0.0007326949994421739, "children": { "_process_rank_one_or_two_observation": { "total": 0.0011674590004986385, "count": 8, "is_parallel": true, "self": 0.0011674590004986385 } } }, "UnityEnvironment.step": { "total": 0.045284408000043186, "count": 1, "is_parallel": true, "self": 0.0005797870003334538, "children": { "UnityEnvironment._generate_step_input": { "total": 0.0005046559999755118, "count": 1, "is_parallel": true, "self": 0.0005046559999755118 }, "communicator.exchange": { "total": 0.0424804609997409, "count": 1, "is_parallel": true, "self": 0.0424804609997409 }, "steps_from_proto": { "total": 0.0017195039999933215, "count": 1, "is_parallel": true, "self": 0.00042736199975479394, "children": { "_process_rank_one_or_two_observation": { "total": 0.0012921420002385275, "count": 8, "is_parallel": true, "self": 0.0012921420002385275 } } } } } } }, "UnityEnvironment.step": { "total": 928.8780324340605, "count": 50713, "is_parallel": true, "self": 23.856492721886752, "children": { "UnityEnvironment._generate_step_input": { "total": 19.09114741005851, "count": 50713, "is_parallel": true, "self": 19.09114741005851 }, "communicator.exchange": { "total": 799.9183385970555, "count": 50713, "is_parallel": true, "self": 799.9183385970555 }, "steps_from_proto": { "total": 86.01205370505977, "count": 50713, "is_parallel": true, "self": 19.120138897982542, "children": { "_process_rank_one_or_two_observation": { "total": 66.89191480707723, "count": 405704, "is_parallel": true, "self": 66.89191480707723 } } } } } } } } } } }, "trainer_advance": { "total": 598.7740922570074, "count": 50714, "self": 2.0756053139748474, "children": { "process_trajectory": { "total": 123.20095220503754, "count": 50714, "self": 122.80800626103746, "children": { "RLTrainer._checkpoint": { "total": 0.39294594400007554, "count": 1, "self": 0.39294594400007554 } } }, "_update_policy": { "total": 473.497534737995, "count": 355, "self": 168.17626016899158, "children": { "TorchPPOOptimizer.update": { "total": 305.32127456900344, "count": 18261, "self": 305.32127456900344 } } } } } } }, "trainer_threads": { "total": 1.184000211651437e-06, "count": 1, "self": 1.184000211651437e-06 }, "TrainerController._save_models": { "total": 0.3766865970001163, "count": 1, "self": 0.00976375500067661, "children": { "RLTrainer._checkpoint": { "total": 0.3669228419994397, "count": 1, "self": 0.3669228419994397 } } } } } } }