{ "name": "root", "gauges": { "Pyramids.Policy.Entropy.mean": { "value": 0.5555771589279175, "min": 0.5555771589279175, "max": 1.3511556386947632, "count": 33 }, "Pyramids.Policy.Entropy.sum": { "value": 16533.9765625, "min": 16533.9765625, "max": 40988.65625, "count": 33 }, "Pyramids.Step.mean": { "value": 989950.0, "min": 29952.0, "max": 989950.0, "count": 33 }, "Pyramids.Step.sum": { "value": 989950.0, "min": 29952.0, "max": 989950.0, "count": 33 }, "Pyramids.Policy.ExtrinsicValueEstimate.mean": { "value": 0.13370367884635925, "min": -0.10792555660009384, "max": 0.18158511817455292, "count": 33 }, "Pyramids.Policy.ExtrinsicValueEstimate.sum": { "value": 33.55962371826172, "min": -26.010059356689453, "max": 45.941036224365234, "count": 33 }, "Pyramids.Policy.RndValueEstimate.mean": { "value": 0.005116866901516914, "min": -0.005071492865681648, "max": 0.29099249839782715, "count": 33 }, "Pyramids.Policy.RndValueEstimate.sum": { "value": 1.28433358669281, "min": -1.25773024559021, "max": 68.96522521972656, "count": 33 }, "Pyramids.Losses.PolicyLoss.mean": { "value": 0.04412110306937912, "min": 0.04412110306937912, "max": 0.05179467467004339, "count": 33 }, "Pyramids.Losses.PolicyLoss.sum": { "value": 0.6176954429713077, "min": 0.3625627226903037, "max": 0.7059182961264419, "count": 33 }, "Pyramids.Losses.ValueLoss.mean": { "value": 0.0075576953130231635, "min": 0.0002963896903985677, "max": 0.011014831698115332, "count": 33 }, "Pyramids.Losses.ValueLoss.sum": { "value": 0.10580773438232428, "min": 0.0038530659751813807, "max": 0.11891083483351396, "count": 33 }, "Pyramids.Policy.LearningRate.mean": { "value": 7.222319021164285e-06, "min": 7.222319021164285e-06, "max": 0.00029515063018788575, "count": 33 }, "Pyramids.Policy.LearningRate.sum": { "value": 0.0001011124662963, "min": 0.0001011124662963, "max": 0.0035081342306219994, "count": 33 }, "Pyramids.Policy.Epsilon.mean": { "value": 0.10240740714285712, "min": 0.10240740714285712, "max": 0.19838354285714285, "count": 33 }, "Pyramids.Policy.Epsilon.sum": { "value": 1.4337036999999997, "min": 1.3886848, "max": 2.569378, "count": 33 }, "Pyramids.Policy.Beta.mean": { "value": 0.000491240687857143, "min": 0.000491240687857143, "max": 0.019676870217142855, "count": 33 }, "Pyramids.Policy.Beta.sum": { "value": 0.006877369630000002, "min": 0.006877369630000002, "max": 0.2338986622, "count": 33 }, "Pyramids.Losses.RNDLoss.mean": { "value": 0.010875050909817219, "min": 0.010875050909817219, "max": 0.5158635377883911, "count": 33 }, "Pyramids.Losses.RNDLoss.sum": { "value": 0.15225070714950562, "min": 0.15225070714950562, "max": 3.6110448837280273, "count": 33 }, "Pyramids.Environment.EpisodeLength.mean": { "value": 724.4878048780488, "min": 673.8666666666667, "max": 999.0, "count": 33 }, "Pyramids.Environment.EpisodeLength.sum": { "value": 29704.0, "min": 15984.0, "max": 32686.0, "count": 33 }, "Pyramids.Environment.CumulativeReward.mean": { "value": 0.4947511893583507, "min": -1.0000000521540642, "max": 0.6592444040709071, "count": 33 }, "Pyramids.Environment.CumulativeReward.sum": { "value": 20.28479876369238, "min": -30.514801643788815, "max": 29.665998183190823, "count": 33 }, "Pyramids.Policy.ExtrinsicReward.mean": { "value": 0.4947511893583507, "min": -1.0000000521540642, "max": 0.6592444040709071, "count": 33 }, "Pyramids.Policy.ExtrinsicReward.sum": { "value": 20.28479876369238, "min": -30.514801643788815, "max": 29.665998183190823, "count": 33 }, "Pyramids.Policy.RndReward.mean": { "value": 0.1651188201184396, "min": 0.1591329200620142, "max": 21.3197267241776, "count": 33 }, "Pyramids.Policy.RndReward.sum": { "value": 6.769871624856023, "min": 6.769871624856023, "max": 341.1156275868416, "count": 33 }, "Pyramids.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 33 }, "Pyramids.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 33 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1700922570", "python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]", "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", "mlagents_version": "1.1.0.dev0", "mlagents_envs_version": "1.1.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "2.1.0+cu118", "numpy_version": "1.23.5", "end_time_seconds": "1700924950" }, "total": 2379.785221288, "count": 1, "self": 0.4762838050000937, "children": { "run_training.setup": { "total": 0.08426403199996457, "count": 1, "self": 0.08426403199996457 }, "TrainerController.start_learning": { "total": 2379.224673451, "count": 1, "self": 1.7398534759627182, "children": { "TrainerController._reset_env": { "total": 8.880418856000006, "count": 1, "self": 8.880418856000006 }, "TrainerController.advance": { "total": 2368.526796672037, "count": 63256, "self": 1.7748473900987847, "children": { "env_step": { "total": 1561.87138197193, "count": 63256, "self": 1403.8413400508862, "children": { "SubprocessEnvManager._take_step": { "total": 156.9797802110196, "count": 63256, "self": 5.232784402007383, "children": { "TorchPolicy.evaluate": { "total": 151.74699580901222, "count": 62558, "self": 151.74699580901222 } } }, "workers": { "total": 1.0502617100241878, "count": 63256, "self": 0.0, "children": { "worker_root": { "total": 2373.85237076398, "count": 63256, "is_parallel": true, "self": 1110.5320144279963, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.004845638000006147, "count": 1, "is_parallel": true, "self": 0.0034575689998064263, "children": { "_process_rank_one_or_two_observation": { "total": 0.001388069000199721, "count": 8, "is_parallel": true, "self": 0.001388069000199721 } } }, "UnityEnvironment.step": { "total": 0.09867285399991488, "count": 1, "is_parallel": true, "self": 0.0006190619998278635, "children": { "UnityEnvironment._generate_step_input": { "total": 0.000484259000018028, "count": 1, "is_parallel": true, "self": 0.000484259000018028 }, "communicator.exchange": { "total": 0.0957939490000399, "count": 1, "is_parallel": true, "self": 0.0957939490000399 }, "steps_from_proto": { "total": 0.0017755840000290846, "count": 1, "is_parallel": true, "self": 0.0003598540000666617, "children": { "_process_rank_one_or_two_observation": { "total": 0.0014157299999624229, "count": 8, "is_parallel": true, "self": 0.0014157299999624229 } } } } } } }, "UnityEnvironment.step": { "total": 1263.320356335984, "count": 63255, "is_parallel": true, "self": 38.128328791952754, "children": { "UnityEnvironment._generate_step_input": { "total": 26.64825646602071, "count": 63255, "is_parallel": true, "self": 26.64825646602071 }, "communicator.exchange": { "total": 1088.3408103369848, "count": 63255, "is_parallel": true, "self": 1088.3408103369848 }, "steps_from_proto": { "total": 110.20296074102555, "count": 63255, "is_parallel": true, "self": 23.23439513398307, "children": { "_process_rank_one_or_two_observation": { "total": 86.96856560704248, "count": 506040, "is_parallel": true, "self": 86.96856560704248 } } } } } } } } } } }, "trainer_advance": { "total": 804.8805673100082, "count": 63256, "self": 3.182003762995919, "children": { "process_trajectory": { "total": 136.600109983013, "count": 63256, "self": 136.3887323480128, "children": { "RLTrainer._checkpoint": { "total": 0.2113776350001899, "count": 2, "self": 0.2113776350001899 } } }, "_update_policy": { "total": 665.0984535639993, "count": 446, "self": 465.9359561330024, "children": { "TorchPPOOptimizer.update": { "total": 199.16249743099695, "count": 18755, "self": 199.16249743099695 } } } } } } }, "trainer_threads": { "total": 9.479999789618887e-07, "count": 1, "self": 9.479999789618887e-07 }, "TrainerController._save_models": { "total": 0.07760349899990615, "count": 1, "self": 0.0014059569998607913, "children": { "RLTrainer._checkpoint": { "total": 0.07619754200004536, "count": 1, "self": 0.07619754200004536 } } } } } } }