{ "name": "root", "gauges": { "Pyramids.Policy.Entropy.mean": { "value": 0.43180933594703674, "min": 0.43126070499420166, "max": 1.5841691493988037, "count": 40 }, "Pyramids.Policy.Entropy.sum": { "value": 13057.9140625, "min": 12861.9189453125, "max": 48057.35546875, "count": 40 }, "Pyramids.Step.mean": { "value": 1199891.0, "min": 29952.0, "max": 1199891.0, "count": 40 }, "Pyramids.Step.sum": { "value": 1199891.0, "min": 29952.0, "max": 1199891.0, "count": 40 }, "Pyramids.Policy.ExtrinsicValueEstimate.mean": { "value": 0.4963719844818115, "min": -0.09791506081819534, "max": 0.4963719844818115, "count": 40 }, "Pyramids.Policy.ExtrinsicValueEstimate.sum": { "value": 135.50955200195312, "min": -23.597530364990234, "max": 135.50955200195312, "count": 40 }, "Pyramids.Policy.RndValueEstimate.mean": { "value": -0.0096103735268116, "min": -0.0096103735268116, "max": 0.1173042431473732, "count": 40 }, "Pyramids.Policy.RndValueEstimate.sum": { "value": -2.6236319541931152, "min": -2.6236319541931152, "max": 28.153018951416016, "count": 40 }, "Pyramids.Losses.PolicyLoss.mean": { "value": 0.04931616802267464, "min": 0.04450815466615105, "max": 0.052197964594438026, "count": 40 }, "Pyramids.Losses.PolicyLoss.sum": { "value": 0.3452131761587225, "min": 0.20525118841958995, "max": 0.3985707801184617, "count": 40 }, "Pyramids.Losses.ValueLoss.mean": { "value": 0.014306249213404953, "min": 0.00017832834793734214, "max": 0.014403587880743933, "count": 40 }, "Pyramids.Losses.ValueLoss.sum": { "value": 0.10014374449383467, "min": 0.0008916417396867106, "max": 0.10336133686359972, "count": 40 }, "Pyramids.Policy.LearningRate.mean": { "value": 3.6113845105238155e-06, "min": 3.6113845105238155e-06, "max": 0.000296208001264, "count": 40 }, "Pyramids.Policy.LearningRate.sum": { "value": 2.5279691573666707e-05, "min": 2.5279691573666707e-05, "max": 0.0018137743454085832, "count": 40 }, "Pyramids.Policy.Epsilon.mean": { "value": 0.1012037619047619, "min": 0.1012037619047619, "max": 0.19873600000000002, "count": 40 }, "Pyramids.Policy.Epsilon.sum": { "value": 0.7084263333333333, "min": 0.7084263333333333, "max": 1.3101369166666668, "count": 40 }, "Pyramids.Policy.Beta.mean": { "value": 0.00013025581428571448, "min": 0.00013025581428571448, "max": 0.009873726399999998, "count": 40 }, "Pyramids.Policy.Beta.sum": { "value": 0.0009117907000000014, "min": 0.0009117907000000014, "max": 0.060468682525, "count": 40 }, "Pyramids.Losses.RNDLoss.mean": { "value": 0.008115310221910477, "min": 0.007542174309492111, "max": 0.18715202808380127, "count": 40 }, "Pyramids.Losses.RNDLoss.sum": { "value": 0.05680717155337334, "min": 0.05279522016644478, "max": 0.7486081123352051, "count": 40 }, "Pyramids.Environment.EpisodeLength.mean": { "value": 383.4230769230769, "min": 383.4230769230769, "max": 999.0, "count": 40 }, "Pyramids.Environment.EpisodeLength.sum": { "value": 29907.0, "min": 15984.0, "max": 33086.0, "count": 40 }, "Pyramids.Environment.CumulativeReward.mean": { "value": 1.5396256252932243, "min": -1.0000000521540642, "max": 1.5396256252932243, "count": 40 }, "Pyramids.Environment.CumulativeReward.sum": { "value": 120.0907987728715, "min": -32.000001668930054, "max": 120.0907987728715, "count": 40 }, "Pyramids.Policy.ExtrinsicReward.mean": { "value": 1.5396256252932243, "min": -1.0000000521540642, "max": 1.5396256252932243, "count": 40 }, "Pyramids.Policy.ExtrinsicReward.sum": { "value": 120.0907987728715, "min": -32.000001668930054, "max": 120.0907987728715, "count": 40 }, "Pyramids.Policy.RndReward.mean": { "value": 0.03217785571140643, "min": 0.03217785571140643, "max": 7.243808610364795, "count": 40 }, "Pyramids.Policy.RndReward.sum": { "value": 2.5098727454897016, "min": 2.2504812776460312, "max": 115.90093776583672, "count": 40 }, "Pyramids.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 40 }, "Pyramids.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 40 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1673448733", "python_version": "3.8.16 (default, Dec 7 2022, 01:12:13) \n[GCC 7.5.0]", "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", "mlagents_version": "0.29.0.dev0", "mlagents_envs_version": "0.29.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.8.1+cu102", "numpy_version": "1.21.6", "end_time_seconds": "1673451049" }, "total": 2316.370975376, "count": 1, "self": 0.6260153549997085, "children": { "run_training.setup": { "total": 0.10593957699984458, "count": 1, "self": 0.10593957699984458 }, "TrainerController.start_learning": { "total": 2315.6390204440004, "count": 1, "self": 1.4057620270305051, "children": { "TrainerController._reset_env": { "total": 6.388285214000007, "count": 1, "self": 6.388285214000007 }, "TrainerController.advance": { "total": 2307.7510039419694, "count": 76259, "self": 1.4356994739641777, "children": { "env_step": { "total": 1637.0692565220188, "count": 76259, "self": 1515.5732718749987, "children": { "SubprocessEnvManager._take_step": { "total": 120.61312878302147, "count": 76259, "self": 4.999279493094718, "children": { "TorchPolicy.evaluate": { "total": 115.61384928992675, "count": 75068, "self": 38.78389159491121, "children": { "TorchPolicy.sample_actions": { "total": 76.82995769501554, "count": 75068, "self": 76.82995769501554 } } } } }, "workers": { "total": 0.8828558639986568, "count": 76259, "self": 0.0, "children": { "worker_root": { "total": 2310.5169555260563, "count": 76259, "is_parallel": true, "self": 909.5085581379908, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.0016701409999768657, "count": 1, "is_parallel": true, "self": 0.0005794080000214308, "children": { "_process_rank_one_or_two_observation": { "total": 0.001090732999955435, "count": 8, "is_parallel": true, "self": 0.001090732999955435 } } }, "UnityEnvironment.step": { "total": 0.045528187999934744, "count": 1, "is_parallel": true, "self": 0.0005240550001417432, "children": { "UnityEnvironment._generate_step_input": { "total": 0.000475739999956204, "count": 1, "is_parallel": true, "self": 0.000475739999956204 }, "communicator.exchange": { "total": 0.042888253000000987, "count": 1, "is_parallel": true, "self": 0.042888253000000987 }, "steps_from_proto": { "total": 0.0016401399998358102, "count": 1, "is_parallel": true, "self": 0.00048265899999933026, "children": { "_process_rank_one_or_two_observation": { "total": 0.00115748099983648, "count": 8, "is_parallel": true, "self": 0.00115748099983648 } } } } } } }, "UnityEnvironment.step": { "total": 1401.0083973880655, "count": 76258, "is_parallel": true, "self": 32.891922812191524, "children": { "UnityEnvironment._generate_step_input": { "total": 25.949304434957867, "count": 76258, "is_parallel": true, "self": 25.949304434957867 }, "communicator.exchange": { "total": 1224.2630952949764, "count": 76258, "is_parallel": true, "self": 1224.2630952949764 }, "steps_from_proto": { "total": 117.9040748459397, "count": 76258, "is_parallel": true, "self": 25.372826467717005, "children": { "_process_rank_one_or_two_observation": { "total": 92.5312483782227, "count": 610064, "is_parallel": true, "self": 92.5312483782227 } } } } } } } } } } }, "trainer_advance": { "total": 669.2460479459864, "count": 76259, "self": 2.581488622969573, "children": { "process_trajectory": { "total": 169.37972792301798, "count": 76259, "self": 169.18406680901785, "children": { "RLTrainer._checkpoint": { "total": 0.19566111400013142, "count": 2, "self": 0.19566111400013142 } } }, "_update_policy": { "total": 497.2848313999989, "count": 275, "self": 234.75314104901554, "children": { "TorchPPOOptimizer.update": { "total": 262.53169035098335, "count": 13821, "self": 262.53169035098335 } } } } } } }, "trainer_threads": { "total": 8.800002433417831e-07, "count": 1, "self": 8.800002433417831e-07 }, "TrainerController._save_models": { "total": 0.09396838100019522, "count": 1, "self": 0.001431187999969552, "children": { "RLTrainer._checkpoint": { "total": 0.09253719300022567, "count": 1, "self": 0.09253719300022567 } } } } } } }