{ "name": "root", "gauges": { "SoccerTwos.Policy.Entropy.mean": { "value": 3.2140536308288574, "min": 3.1371610164642334, "max": 3.295743227005005, "count": 1000 }, "SoccerTwos.Policy.Entropy.sum": { "value": 87216.5625, "min": 14859.255859375, "max": 123189.3359375, "count": 1000 }, "SoccerTwos.Environment.EpisodeLength.mean": { "value": 689.75, "min": 372.57142857142856, "max": 999.0, "count": 1000 }, "SoccerTwos.Environment.EpisodeLength.sum": { "value": 22072.0, "min": 15984.0, "max": 25980.0, "count": 1000 }, "SoccerTwos.Self-play.ELO.mean": { "value": 1187.6966732241428, "min": 1153.841539058977, "max": 1200.1767817874518, "count": 840 }, "SoccerTwos.Self-play.ELO.sum": { "value": 9501.573385793143, "min": 2307.683078117954, "max": 28693.76147327935, "count": 840 }, "SoccerTwos.Step.mean": { "value": 9999782.0, "min": 9010.0, "max": 9999782.0, "count": 1000 }, "SoccerTwos.Step.sum": { "value": 9999782.0, "min": 9010.0, "max": 9999782.0, "count": 1000 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { "value": -0.01656908541917801, "min": -0.0285890344530344, "max": 0.018183618783950806, "count": 1000 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { "value": -0.24853627383708954, "min": -0.6358370780944824, "max": 0.3091215193271637, "count": 1000 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { "value": -0.014030274003744125, "min": -0.02842695266008377, "max": 0.006985607091337442, "count": 1000 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { "value": -0.21045410633087158, "min": -0.5299453735351562, "max": 0.10471726953983307, "count": 1000 }, "SoccerTwos.Environment.CumulativeReward.mean": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 1000 }, "SoccerTwos.Environment.CumulativeReward.sum": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 1000 }, "SoccerTwos.Policy.ExtrinsicReward.mean": { "value": 0.11269332567850748, "min": -0.625, "max": 0.43426666657129925, "count": 1000 }, "SoccerTwos.Policy.ExtrinsicReward.sum": { "value": 1.6903998851776123, "min": -11.209600031375885, "max": 7.816799998283386, "count": 1000 }, "SoccerTwos.Environment.GroupCumulativeReward.mean": { "value": 0.11269332567850748, "min": -0.625, "max": 0.43426666657129925, "count": 1000 }, "SoccerTwos.Environment.GroupCumulativeReward.sum": { "value": 1.6903998851776123, "min": -11.209600031375885, "max": 7.816799998283386, "count": 1000 }, "SoccerTwos.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 1000 }, "SoccerTwos.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 1000 }, "SoccerTwos.Losses.PolicyLoss.mean": { "value": 0.009222518963118395, "min": 0.0018380905045584466, "max": 0.016796006510655086, "count": 466 }, "SoccerTwos.Losses.PolicyLoss.sum": { "value": 0.009222518963118395, "min": 0.0018380905045584466, "max": 0.016796006510655086, "count": 466 }, "SoccerTwos.Losses.ValueLoss.mean": { "value": 0.002672747204390665, "min": 8.787856226414684e-07, "max": 0.01493195490911603, "count": 466 }, "SoccerTwos.Losses.ValueLoss.sum": { "value": 0.002672747204390665, "min": 8.787856226414684e-07, "max": 0.01493195490911603, "count": 466 }, "SoccerTwos.Losses.BaselineLoss.mean": { "value": 0.0026594311154137054, "min": 5.442700323025443e-07, "max": 0.01496061822399497, "count": 466 }, "SoccerTwos.Losses.BaselineLoss.sum": { "value": 0.0026594311154137054, "min": 5.442700323025443e-07, "max": 0.01496061822399497, "count": 466 }, "SoccerTwos.Policy.LearningRate.mean": { "value": 0.0003, "min": 0.0003, "max": 0.0003, "count": 466 }, "SoccerTwos.Policy.LearningRate.sum": { "value": 0.0003, "min": 0.0003, "max": 0.0003, "count": 466 }, "SoccerTwos.Policy.Epsilon.mean": { "value": 0.19999999999999998, "min": 0.19999999999999998, "max": 0.19999999999999998, "count": 466 }, "SoccerTwos.Policy.Epsilon.sum": { "value": 0.19999999999999998, "min": 0.19999999999999998, "max": 0.19999999999999998, "count": 466 }, "SoccerTwos.Policy.Beta.mean": { "value": 0.005, "min": 0.005, "max": 0.005, "count": 466 }, "SoccerTwos.Policy.Beta.sum": { "value": 0.005, "min": 0.005, "max": 0.005, "count": 466 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1714021025", "python_version": "3.10.12 | packaged by conda-forge | (main, Jun 23 2023, 22:40:32) [GCC 12.3.0]", "command_line_arguments": "/opt/conda/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force", "mlagents_version": "1.1.0.dev0", "mlagents_envs_version": "1.1.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "2.3.0+cu121", "numpy_version": "1.23.5", "end_time_seconds": "1714042856" }, "total": 21830.642082236, "count": 1, "self": 0.3244513259996893, "children": { "run_training.setup": { "total": 0.023126756000010573, "count": 1, "self": 0.023126756000010573 }, "TrainerController.start_learning": { "total": 21830.294504154, "count": 1, "self": 17.681241414793476, "children": { "TrainerController._reset_env": { "total": 7.963951644991766, "count": 50, "self": 7.963951644991766 }, "TrainerController.advance": { "total": 21804.44504638521, "count": 650905, "self": 18.84673021924391, "children": { "env_step": { "total": 16890.455054930666, "count": 650905, "self": 12782.116950416483, "children": { "SubprocessEnvManager._take_step": { "total": 4097.01059741472, "count": 650905, "self": 126.73519772110421, "children": { "TorchPolicy.evaluate": { "total": 3970.275399693616, "count": 1291756, "self": 3970.275399693616 } } }, "workers": { "total": 11.327507099463446, "count": 650905, "self": 0.0, "children": { "worker_root": { "total": 21802.707380226264, "count": 650905, "is_parallel": true, "self": 11594.57311845469, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.0045256380001319485, "count": 2, "is_parallel": true, "self": 0.0011403580003843672, "children": { "_process_rank_one_or_two_observation": { "total": 0.0033852799997475813, "count": 8, "is_parallel": true, "self": 0.0033852799997475813 } } }, "UnityEnvironment.step": { "total": 0.0403048900000158, "count": 1, "is_parallel": true, "self": 0.0009176909998132032, "children": { "UnityEnvironment._generate_step_input": { "total": 0.0010829500001818815, "count": 1, "is_parallel": true, "self": 0.0010829500001818815 }, "communicator.exchange": { "total": 0.03505178000000342, "count": 1, "is_parallel": true, "self": 0.03505178000000342 }, "steps_from_proto": { "total": 0.0032524690000172995, "count": 2, "is_parallel": true, "self": 0.0006490769999345503, "children": { "_process_rank_one_or_two_observation": { "total": 0.0026033920000827493, "count": 8, "is_parallel": true, "self": 0.0026033920000827493 } } } } } } }, "UnityEnvironment.step": { "total": 10207.980765756565, "count": 650904, "is_parallel": true, "self": 507.85822469908635, "children": { "UnityEnvironment._generate_step_input": { "total": 446.99434314346354, "count": 650904, "is_parallel": true, "self": 446.99434314346354 }, "communicator.exchange": { "total": 7188.0503721799605, "count": 650904, "is_parallel": true, "self": 7188.0503721799605 }, "steps_from_proto": { "total": 2065.077825734055, "count": 1301808, "is_parallel": true, "self": 359.3358679757, "children": { "_process_rank_one_or_two_observation": { "total": 1705.7419577583548, "count": 5207232, "is_parallel": true, "self": 1705.7419577583548 } } } } }, "steps_from_proto": { "total": 0.1534960150088409, "count": 98, "is_parallel": true, "self": 0.02746741501323413, "children": { "_process_rank_one_or_two_observation": { "total": 0.12602859999560678, "count": 392, "is_parallel": true, "self": 0.12602859999560678 } } } } } } } } }, "trainer_advance": { "total": 4895.143261235304, "count": 650905, "self": 152.33847000950027, "children": { "process_trajectory": { "total": 1271.8683250818606, "count": 650905, "self": 1267.4993024908624, "children": { "RLTrainer._checkpoint": { "total": 4.369022590998156, "count": 20, "self": 4.369022590998156 } } }, "_update_policy": { "total": 3470.936466143943, "count": 466, "self": 2705.017264349991, "children": { "TorchPOCAOptimizer.update": { "total": 765.9192017939522, "count": 2796, "self": 765.9192017939522 } } } } } } }, "trainer_threads": { "total": 1.200998667627573e-06, "count": 1, "self": 1.200998667627573e-06 }, "TrainerController._save_models": { "total": 0.20426350800335058, "count": 1, "self": 0.001985904003959149, "children": { "RLTrainer._checkpoint": { "total": 0.20227760399939143, "count": 1, "self": 0.20227760399939143 } } } } } } }