{ "name": "root", "gauges": { "SoccerTwos.Policy.Entropy.mean": { "value": 3.268545627593994, "min": 3.268545627593994, "max": 3.2688074111938477, "count": 2 }, "SoccerTwos.Policy.Entropy.sum": { "value": 65370.9140625, "min": 65370.9140625, "max": 104601.8359375, "count": 2 }, "SoccerTwos.Environment.EpisodeLength.mean": { "value": 660.6666666666666, "min": 657.1, "max": 660.6666666666666, "count": 2 }, "SoccerTwos.Environment.EpisodeLength.sum": { "value": 7928.0, "min": 7928.0, "max": 26284.0, "count": 2 }, "SoccerTwos.Self-play.ELO.mean": { "value": 1199.2933648526175, "min": 1198.4233408102318, "max": 1199.2933648526175, "count": 2 }, "SoccerTwos.Self-play.ELO.sum": { "value": 4797.17345941047, "min": 4797.17345941047, "max": 11984.233408102318, "count": 2 }, "SoccerTwos.Step.mean": { "value": 129555.0, "min": 119210.0, "max": 129555.0, "count": 2 }, "SoccerTwos.Step.sum": { "value": 129555.0, "min": 119210.0, "max": 129555.0, "count": 2 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { "value": 0.04442071542143822, "min": 0.04442071542143822, "max": 0.04516923800110817, "count": 2 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { "value": 0.5330485701560974, "min": 0.5330485701560974, "max": 0.5872001051902771, "count": 2 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { "value": 0.04456588253378868, "min": 0.04456588253378868, "max": 0.04510977119207382, "count": 2 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { "value": 0.534790575504303, "min": 0.534790575504303, "max": 0.5864270329475403, "count": 2 }, "SoccerTwos.Environment.CumulativeReward.mean": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 2 }, "SoccerTwos.Environment.CumulativeReward.sum": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 2 }, "SoccerTwos.Policy.ExtrinsicReward.mean": { "value": 0.13798333704471588, "min": 0.05710769616640531, "max": 0.13798333704471588, "count": 2 }, "SoccerTwos.Policy.ExtrinsicReward.sum": { "value": 1.6558000445365906, "min": 0.742400050163269, "max": 1.6558000445365906, "count": 2 }, "SoccerTwos.Environment.GroupCumulativeReward.mean": { "value": 0.13798333704471588, "min": 0.05710769616640531, "max": 0.13798333704471588, "count": 2 }, "SoccerTwos.Environment.GroupCumulativeReward.sum": { "value": 1.6558000445365906, "min": 0.742400050163269, "max": 1.6558000445365906, "count": 2 }, "SoccerTwos.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 2 }, "SoccerTwos.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 2 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1685356016", "python_version": "3.9.16 (main, Mar 8 2023, 10:39:24) [MSC v.1916 64 bit (AMD64)]", "command_line_arguments": "D:\\Users\\Karth\\miniconda3\\envs\\rl\\Scripts\\mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos --no-graphics --resume", "mlagents_version": "0.31.0.dev0", "mlagents_envs_version": "0.31.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "2.0.1+cpu", "numpy_version": "1.21.2", "end_time_seconds": "1685356254" }, "total": 238.2041421, "count": 1, "self": 3.9869597000000283, "children": { "run_training.setup": { "total": 0.5120532999999998, "count": 1, "self": 0.5120532999999998 }, "TrainerController.start_learning": { "total": 233.7051291, "count": 1, "self": 0.20140879999965478, "children": { "TrainerController._reset_env": { "total": 42.0219721, "count": 1, "self": 42.0219721 }, "TrainerController.advance": { "total": 190.25874190000033, "count": 1780, "self": 0.22091580000071076, "children": { "env_step": { "total": 170.30585719999985, "count": 1780, "self": 130.81243989999928, "children": { "SubprocessEnvManager._take_step": { "total": 39.37364489999948, "count": 1780, "self": 1.2718991999998295, "children": { "TorchPolicy.evaluate": { "total": 38.101745699999654, "count": 3542, "self": 38.101745699999654 } } }, "workers": { "total": 0.11977240000108935, "count": 1779, "self": 0.0, "children": { "worker_root": { "total": 190.64747180000015, "count": 1779, "is_parallel": true, "self": 84.58078559999983, "children": { "steps_from_proto": { "total": 0.008490699999995854, "count": 2, "is_parallel": true, "self": 0.0018218999999746188, "children": { "_process_rank_one_or_two_observation": { "total": 0.0066688000000212355, "count": 8, "is_parallel": true, "self": 0.0066688000000212355 } } }, "UnityEnvironment.step": { "total": 106.05819550000032, "count": 1779, "is_parallel": true, "self": 5.746424800000739, "children": { "UnityEnvironment._generate_step_input": { "total": 4.955105699999756, "count": 1779, "is_parallel": true, "self": 4.955105699999756 }, "communicator.exchange": { "total": 76.44259999999997, "count": 1779, "is_parallel": true, "self": 76.44259999999997 }, "steps_from_proto": { "total": 18.91406499999986, "count": 3558, "is_parallel": true, "self": 3.9178382000003964, "children": { "_process_rank_one_or_two_observation": { "total": 14.996226799999462, "count": 14232, "is_parallel": true, "self": 14.996226799999462 } } } } } } } } } } }, "trainer_advance": { "total": 19.731968899999764, "count": 1779, "self": 0.7386796999991816, "children": { "process_trajectory": { "total": 18.993289200000582, "count": 1779, "self": 18.993289200000582 } } } } }, "trainer_threads": { "total": 6.000000013273166e-06, "count": 1, "self": 6.000000013273166e-06 }, "TrainerController._save_models": { "total": 1.2230002999999954, "count": 1, "self": 0.03244680000000244, "children": { "RLTrainer._checkpoint": { "total": 1.190553499999993, "count": 1, "self": 1.190553499999993 } } } } } } }