{ "name": "root", "gauges": { "SoccerTwos.Policy.Entropy.mean": { "value": 1.442643404006958, "min": 1.3646326065063477, "max": 1.5156055688858032, "count": 401 }, "SoccerTwos.Policy.Entropy.sum": { "value": 29083.69140625, "min": 964.6746826171875, "max": 34790.27734375, "count": 401 }, "SoccerTwos.Environment.EpisodeLength.mean": { "value": 58.892857142857146, "min": 16.0, "max": 91.64150943396227, "count": 401 }, "SoccerTwos.Environment.EpisodeLength.sum": { "value": 19788.0, "min": 192.0, "max": 20676.0, "count": 401 }, "SoccerTwos.Self-play.ELO.mean": { "value": 1536.758699507207, "min": 1513.376511471752, "max": 1570.2386341842073, "count": 401 }, "SoccerTwos.Self-play.ELO.sum": { "value": 258175.46151721076, "min": 9114.78279783337, "max": 339446.648018735, "count": 401 }, "SoccerTwos.Step.mean": { "value": 29999984.0, "min": 25999991.0, "max": 29999984.0, "count": 401 }, "SoccerTwos.Step.sum": { "value": 29999984.0, "min": 25999991.0, "max": 29999984.0, "count": 401 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { "value": -0.06340470910072327, "min": -0.23134204745292664, "max": 0.08946024626493454, "count": 401 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { "value": -10.65199089050293, "min": -21.37249755859375, "max": 11.450911521911621, "count": 401 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { "value": -0.0660364106297493, "min": -0.23267503082752228, "max": 0.09010016918182373, "count": 401 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { "value": -11.094117164611816, "min": -21.51323699951172, "max": 11.532821655273438, "count": 401 }, "SoccerTwos.Environment.CumulativeReward.mean": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 401 }, "SoccerTwos.Environment.CumulativeReward.sum": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 401 }, "SoccerTwos.Policy.ExtrinsicReward.mean": { "value": -0.37794047523112523, "min": -1.0, "max": 0.3092654096255512, "count": 401 }, "SoccerTwos.Policy.ExtrinsicReward.sum": { "value": -63.49399983882904, "min": -63.49399983882904, "max": 49.17320013046265, "count": 401 }, "SoccerTwos.Environment.GroupCumulativeReward.mean": { "value": -0.37794047523112523, "min": -1.0, "max": 0.3092654096255512, "count": 401 }, "SoccerTwos.Environment.GroupCumulativeReward.sum": { "value": -63.49399983882904, "min": -63.49399983882904, "max": 49.17320013046265, "count": 401 }, "SoccerTwos.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 401 }, "SoccerTwos.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 401 }, "SoccerTwos.Losses.PolicyLoss.mean": { "value": 0.015637130175794784, "min": 0.011390995223094554, "max": 0.025345727618938933, "count": 194 }, "SoccerTwos.Losses.PolicyLoss.sum": { "value": 0.015637130175794784, "min": 0.011390995223094554, "max": 0.025345727618938933, "count": 194 }, "SoccerTwos.Losses.ValueLoss.mean": { "value": 0.10095099707444509, "min": 0.07894389082988103, "max": 0.11518443673849106, "count": 194 }, "SoccerTwos.Losses.ValueLoss.sum": { "value": 0.10095099707444509, "min": 0.07894389082988103, "max": 0.11518443673849106, "count": 194 }, "SoccerTwos.Losses.BaselineLoss.mean": { "value": 0.10293505663673083, "min": 0.0800147719681263, "max": 0.11697089771429697, "count": 194 }, "SoccerTwos.Losses.BaselineLoss.sum": { "value": 0.10293505663673083, "min": 0.0800147719681263, "max": 0.11697089771429697, "count": 194 }, "SoccerTwos.Policy.LearningRate.mean": { "value": 0.0003, "min": 0.0003, "max": 0.0003, "count": 194 }, "SoccerTwos.Policy.LearningRate.sum": { "value": 0.0003, "min": 0.0003, "max": 0.0003, "count": 194 }, "SoccerTwos.Policy.Epsilon.mean": { "value": 0.20000000000000007, "min": 0.20000000000000007, "max": 0.20000000000000007, "count": 194 }, "SoccerTwos.Policy.Epsilon.sum": { "value": 0.20000000000000007, "min": 0.20000000000000007, "max": 0.20000000000000007, "count": 194 }, "SoccerTwos.Policy.Beta.mean": { "value": 0.005000000000000001, "min": 0.005000000000000001, "max": 0.005000000000000001, "count": 194 }, "SoccerTwos.Policy.Beta.sum": { "value": 0.005000000000000001, "min": 0.005000000000000001, "max": 0.005000000000000001, "count": 194 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1683274975", "python_version": "3.9.16 (main, Apr 12 2023, 06:58:15) \n[GCC 10.2.1 20210110]", "command_line_arguments": "/home/adsp/.local/bin/mlagents-learn /app/ml-agents/config/poca/SoccerTwos.yaml --env=/app/ml-agents/training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --resume", "mlagents_version": "0.31.0.dev0", "mlagents_envs_version": "0.31.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.11.0+cu102", "numpy_version": "1.21.2", "end_time_seconds": "1683304836" }, "total": 21052.462681778998, "count": 1, "self": 1.3189635519956937, "children": { "run_training.setup": { "total": 0.18352584300004082, "count": 1, "self": 0.18352584300004082 }, "TrainerController.start_learning": { "total": 21050.960192384002, "count": 1, "self": 11.725414112748695, "children": { "TrainerController._reset_env": { "total": 13.553882120002925, "count": 21, "self": 13.553882120002925 }, "TrainerController.advance": { "total": 21025.28174819625, "count": 277300, "self": 11.90760220748416, "children": { "env_step": { "total": 9961.931052763448, "count": 277300, "self": 8486.755533540296, "children": { "SubprocessEnvManager._take_step": { "total": 1468.213213065258, "count": 277300, "self": 66.82326059318234, "children": { "TorchPolicy.evaluate": { "total": 1401.3899524720757, "count": 502138, "self": 1401.3899524720757 } } }, "workers": { "total": 6.962306157894261, "count": 277300, "self": 0.0, "children": { "worker_root": { "total": 21019.985834203908, "count": 277300, "is_parallel": true, "self": 13753.178573381148, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.005918918000020312, "count": 2, "is_parallel": true, "self": 0.002527409999970587, "children": { "_process_rank_one_or_two_observation": { "total": 0.0033915080000497255, "count": 8, "is_parallel": true, "self": 0.0033915080000497255 } } }, "UnityEnvironment.step": { "total": 0.060281557000053, "count": 1, "is_parallel": true, "self": 0.00105069500011723, "children": { "UnityEnvironment._generate_step_input": { "total": 0.0009998699999869132, "count": 1, "is_parallel": true, "self": 0.0009998699999869132 }, "communicator.exchange": { "total": 0.05436580899998944, "count": 1, "is_parallel": true, "self": 0.05436580899998944 }, "steps_from_proto": { "total": 0.0038651829999594156, "count": 2, "is_parallel": true, "self": 0.0011909479999303585, "children": { "_process_rank_one_or_two_observation": { "total": 0.002674235000029057, "count": 8, "is_parallel": true, "self": 0.002674235000029057 } } } } } } }, "steps_from_proto": { "total": 0.052836068993315166, "count": 40, "is_parallel": true, "self": 0.011889546985003108, "children": { "_process_rank_one_or_two_observation": { "total": 0.04094652200831206, "count": 160, "is_parallel": true, "self": 0.04094652200831206 } } }, "UnityEnvironment.step": { "total": 7266.754424753766, "count": 277299, "is_parallel": true, "self": 244.94494398424104, "children": { "UnityEnvironment._generate_step_input": { "total": 232.1515300788497, "count": 277299, "is_parallel": true, "self": 232.1515300788497 }, "communicator.exchange": { "total": 6062.591858620617, "count": 277299, "is_parallel": true, "self": 6062.591858620617 }, "steps_from_proto": { "total": 727.0660920700589, "count": 554598, "is_parallel": true, "self": 166.1676294218787, "children": { "_process_rank_one_or_two_observation": { "total": 560.8984626481802, "count": 2218392, "is_parallel": true, "self": 560.8984626481802 } } } } } } } } } } }, "trainer_advance": { "total": 11051.443093225316, "count": 277300, "self": 71.37279218860567, "children": { "process_trajectory": { "total": 1740.5465395717101, "count": 277300, "self": 1735.6465254887112, "children": { "RLTrainer._checkpoint": { "total": 4.900014082999007, "count": 9, "self": 4.900014082999007 } } }, "_update_policy": { "total": 9239.523761465, "count": 194, "self": 1089.3161181191253, "children": { "TorchPOCAOptimizer.update": { "total": 8150.207643345874, "count": 5820, "self": 8150.207643345874 } } } } } } }, "trainer_threads": { "total": 2.9090006137266755e-06, "count": 1, "self": 2.9090006137266755e-06 }, "TrainerController._save_models": { "total": 0.39914504600164946, "count": 1, "self": 0.09269286800190457, "children": { "RLTrainer._checkpoint": { "total": 0.3064521779997449, "count": 1, "self": 0.3064521779997449 } } } } } } }