{ "name": "root", "gauges": { "SoccerTwos.Policy.Entropy.mean": { "value": 3.0266637802124023, "min": 3.0074007511138916, "max": 3.2957417964935303, "count": 150 }, "SoccerTwos.Policy.Entropy.sum": { "value": 26537.7890625, "min": 11414.236328125, "max": 123887.0703125, "count": 150 }, "SoccerTwos.Environment.EpisodeLength.mean": { "value": 999.0, "min": 366.0, "max": 999.0, "count": 150 }, "SoccerTwos.Environment.EpisodeLength.sum": { "value": 19980.0, "min": 16216.0, "max": 24340.0, "count": 150 }, "SoccerTwos.Self-play.ELO.mean": { "value": 1200.9095637151368, "min": 1200.3979646050168, "max": 1208.0456558895698, "count": 77 }, "SoccerTwos.Self-play.ELO.sum": { "value": 2401.8191274302735, "min": 2400.7959292100336, "max": 26562.48308573179, "count": 77 }, "SoccerTwos.Step.mean": { "value": 1499052.0, "min": 9188.0, "max": 1499052.0, "count": 150 }, "SoccerTwos.Step.sum": { "value": 1499052.0, "min": 9188.0, "max": 1499052.0, "count": 150 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { "value": 0.0002922726853284985, "min": -0.04077611491084099, "max": 0.0026190406642854214, "count": 150 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { "value": 0.002922726795077324, "min": -0.5919223427772522, "max": 0.07595217972993851, "count": 150 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { "value": 0.00032525171991437674, "min": -0.040881361812353134, "max": 0.0031273856293410063, "count": 150 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { "value": 0.0032525171991437674, "min": -0.5923647880554199, "max": 0.09069418162107468, "count": 150 }, "SoccerTwos.Environment.CumulativeReward.mean": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 150 }, "SoccerTwos.Environment.CumulativeReward.sum": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 150 }, "SoccerTwos.Policy.ExtrinsicReward.mean": { "value": 0.0, "min": -0.5051034474424247, "max": 0.3945249989628792, "count": 150 }, "SoccerTwos.Policy.ExtrinsicReward.sum": { "value": 0.0, "min": -14.647999975830317, "max": 6.312399983406067, "count": 150 }, "SoccerTwos.Environment.GroupCumulativeReward.mean": { "value": 0.0, "min": -0.5051034474424247, "max": 0.3945249989628792, "count": 150 }, "SoccerTwos.Environment.GroupCumulativeReward.sum": { "value": 0.0, "min": -14.647999975830317, "max": 6.312399983406067, "count": 150 }, "SoccerTwos.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 150 }, "SoccerTwos.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 150 }, "SoccerTwos.Losses.PolicyLoss.mean": { "value": 0.019270571356173605, "min": 0.01109234259929508, "max": 0.022038546949625017, "count": 69 }, "SoccerTwos.Losses.PolicyLoss.sum": { "value": 0.019270571356173605, "min": 0.01109234259929508, "max": 0.022038546949625017, "count": 69 }, "SoccerTwos.Losses.ValueLoss.mean": { "value": 4.058379782160652e-07, "min": 2.2539077188336402e-07, "max": 0.00748855258959035, "count": 69 }, "SoccerTwos.Losses.ValueLoss.sum": { "value": 4.058379782160652e-07, "min": 2.2539077188336402e-07, "max": 0.00748855258959035, "count": 69 }, "SoccerTwos.Losses.BaselineLoss.mean": { "value": 3.1599061856013577e-07, "min": 1.9275289702136434e-07, "max": 0.007870006328448653, "count": 69 }, "SoccerTwos.Losses.BaselineLoss.sum": { "value": 3.1599061856013577e-07, "min": 1.9275289702136434e-07, "max": 0.007870006328448653, "count": 69 }, "SoccerTwos.Policy.LearningRate.mean": { "value": 3.896998701333344e-07, "min": 3.896998701333344e-07, "max": 0.0002955628014790666, "count": 69 }, "SoccerTwos.Policy.LearningRate.sum": { "value": 3.896998701333344e-07, "min": 3.896998701333344e-07, "max": 0.0002955628014790666, "count": 69 }, "SoccerTwos.Policy.Epsilon.mean": { "value": 0.1001298666666667, "min": 0.1001298666666667, "max": 0.1985209333333334, "count": 69 }, "SoccerTwos.Policy.Epsilon.sum": { "value": 0.1001298666666667, "min": 0.1001298666666667, "max": 0.1985209333333334, "count": 69 }, "SoccerTwos.Policy.Beta.mean": { "value": 1.6480346666666688e-05, "min": 1.6480346666666688e-05, "max": 0.004926194573333333, "count": 69 }, "SoccerTwos.Policy.Beta.sum": { "value": 1.6480346666666688e-05, "min": 1.6480346666666688e-05, "max": 0.004926194573333333, "count": 69 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1682416743", "python_version": "3.9.16 | packaged by conda-forge | (main, Feb 1 2023, 21:39:03) \n[GCC 11.3.0]", "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos1 --no-graphics", "mlagents_version": "0.31.0.dev0", "mlagents_envs_version": "0.31.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.11.0+cu102", "numpy_version": "1.21.2", "end_time_seconds": "1682437942" }, "total": 21199.008036495, "count": 1, "self": 0.7882214160017611, "children": { "run_training.setup": { "total": 0.028646155000160434, "count": 1, "self": 0.028646155000160434 }, "TrainerController.start_learning": { "total": 21198.191168924, "count": 1, "self": 2.9933048658458574, "children": { "TrainerController._reset_env": { "total": 5.077267550999977, "count": 8, "self": 5.077267550999977 }, "TrainerController.advance": { "total": 21189.687087228154, "count": 97775, "self": 3.5816408247337677, "children": { "env_step": { "total": 20508.776001725786, "count": 97775, "self": 19900.856174474404, "children": { "SubprocessEnvManager._take_step": { "total": 605.9272347737397, "count": 97775, "self": 19.04855248140234, "children": { "TorchPolicy.evaluate": { "total": 586.8786822923373, "count": 194110, "self": 586.8786822923373 } } }, "workers": { "total": 1.992592477641665, "count": 97775, "self": 0.0, "children": { "worker_root": { "total": 21159.56748542517, "count": 97775, "is_parallel": true, "self": 1673.710507693202, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.0034612699998888274, "count": 2, "is_parallel": true, "self": 0.0007102629997461918, "children": { "_process_rank_one_or_two_observation": { "total": 0.0027510070001426357, "count": 8, "is_parallel": true, "self": 0.0027510070001426357 } } }, "UnityEnvironment.step": { "total": 0.1844313480000892, "count": 1, "is_parallel": true, "self": 0.00035165300027983903, "children": { "UnityEnvironment._generate_step_input": { "total": 0.003827283999953579, "count": 1, "is_parallel": true, "self": 0.003827283999953579 }, "communicator.exchange": { "total": 0.17497757099999944, "count": 1, "is_parallel": true, "self": 0.17497757099999944 }, "steps_from_proto": { "total": 0.00527483999985634, "count": 2, "is_parallel": true, "self": 0.0007120100001429819, "children": { "_process_rank_one_or_two_observation": { "total": 0.004562829999713358, "count": 8, "is_parallel": true, "self": 0.004562829999713358 } } } } } } }, "UnityEnvironment.step": { "total": 19485.827531176965, "count": 97774, "is_parallel": true, "self": 51.70431021806871, "children": { "UnityEnvironment._generate_step_input": { "total": 278.590667788181, "count": 97774, "is_parallel": true, "self": 278.590667788181 }, "communicator.exchange": { "total": 18436.39052922608, "count": 97774, "is_parallel": true, "self": 18436.39052922608 }, "steps_from_proto": { "total": 719.1420239446365, "count": 195548, "is_parallel": true, "self": 95.50878036110021, "children": { "_process_rank_one_or_two_observation": { "total": 623.6332435835363, "count": 782192, "is_parallel": true, "self": 623.6332435835363 } } } } }, "steps_from_proto": { "total": 0.029446555003687536, "count": 14, "is_parallel": true, "self": 0.00425714500624963, "children": { "_process_rank_one_or_two_observation": { "total": 0.025189409997437906, "count": 56, "is_parallel": true, "self": 0.025189409997437906 } } } } } } } } }, "trainer_advance": { "total": 677.3294446776358, "count": 97775, "self": 23.256797303710755, "children": { "process_trajectory": { "total": 175.80368680793185, "count": 97775, "self": 165.98220378292513, "children": { "RLTrainer._checkpoint": { "total": 9.821483025006728, "count": 30, "self": 9.821483025006728 } } }, "_update_policy": { "total": 478.2689605659932, "count": 69, "self": 308.31291992297315, "children": { "TorchPOCAOptimizer.update": { "total": 169.95604064302006, "count": 2070, "self": 169.95604064302006 } } } } } } }, "trainer_threads": { "total": 1.3899989426136017e-06, "count": 1, "self": 1.3899989426136017e-06 }, "TrainerController._save_models": { "total": 0.433507888999884, "count": 1, "self": 0.0025145049985439982, "children": { "RLTrainer._checkpoint": { "total": 0.43099338400134, "count": 1, "self": 0.43099338400134 } } } } } } }