{ "name": "root", "gauges": { "SoccerTwos.Policy.Entropy.mean": { "value": 1.8997670412063599, "min": 1.840373158454895, "max": 3.2957375049591064, "count": 500 }, "SoccerTwos.Policy.Entropy.sum": { "value": 38056.1328125, "min": 10524.599609375, "max": 105463.6015625, "count": 500 }, "SoccerTwos.Environment.EpisodeLength.mean": { "value": 52.32631578947368, "min": 36.097744360902254, "max": 999.0, "count": 500 }, "SoccerTwos.Environment.EpisodeLength.sum": { "value": 19884.0, "min": 3996.0, "max": 28936.0, "count": 500 }, "SoccerTwos.Self-play.ELO.mean": { "value": 1579.9891392023628, "min": 1199.95454123925, "max": 1580.9171718560774, "count": 496 }, "SoccerTwos.Self-play.ELO.sum": { "value": 300197.9364484489, "min": 2401.4076928811, "max": 407925.43234129134, "count": 496 }, "SoccerTwos.Step.mean": { "value": 4999984.0, "min": 9484.0, "max": 4999984.0, "count": 500 }, "SoccerTwos.Step.sum": { "value": 4999984.0, "min": 9484.0, "max": 4999984.0, "count": 500 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { "value": -0.000868217321112752, "min": -0.11656514555215836, "max": 0.18462947010993958, "count": 500 }, "SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { "value": -0.16409307718276978, "min": -24.012420654296875, "max": 28.973129272460938, "count": 500 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { "value": 0.00047967469436116517, "min": -0.11385878920555115, "max": 0.19237306714057922, "count": 500 }, "SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { "value": 0.0906585156917572, "min": -23.454910278320312, "max": 30.587318420410156, "count": 500 }, "SoccerTwos.Environment.CumulativeReward.mean": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 500 }, "SoccerTwos.Environment.CumulativeReward.sum": { "value": 0.0, "min": 0.0, "max": 0.0, "count": 500 }, "SoccerTwos.Policy.ExtrinsicReward.mean": { "value": -0.030019048029783543, "min": -0.5433857142925262, "max": 0.46706665886773, "count": 500 }, "SoccerTwos.Policy.ExtrinsicReward.sum": { "value": -5.673600077629089, "min": -55.6139999628067, "max": 65.4522003531456, "count": 500 }, "SoccerTwos.Environment.GroupCumulativeReward.mean": { "value": -0.030019048029783543, "min": -0.5433857142925262, "max": 0.46706665886773, "count": 500 }, "SoccerTwos.Environment.GroupCumulativeReward.sum": { "value": -5.673600077629089, "min": -55.6139999628067, "max": 65.4522003531456, "count": 500 }, "SoccerTwos.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 500 }, "SoccerTwos.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 500 }, "SoccerTwos.Losses.PolicyLoss.mean": { "value": 0.014888953096427333, "min": 0.010700619835794593, "max": 0.022866204695310442, "count": 241 }, "SoccerTwos.Losses.PolicyLoss.sum": { "value": 0.014888953096427333, "min": 0.010700619835794593, "max": 0.022866204695310442, "count": 241 }, "SoccerTwos.Losses.ValueLoss.mean": { "value": 0.11210248867670695, "min": 0.0009040514298249037, "max": 0.12949289282162985, "count": 241 }, "SoccerTwos.Losses.ValueLoss.sum": { "value": 0.11210248867670695, "min": 0.0009040514298249037, "max": 0.12949289282162985, "count": 241 }, "SoccerTwos.Losses.BaselineLoss.mean": { "value": 0.11408566360672315, "min": 0.0009649987869824355, "max": 0.13167524288098018, "count": 241 }, "SoccerTwos.Losses.BaselineLoss.sum": { "value": 0.11408566360672315, "min": 0.0009649987869824355, "max": 0.13167524288098018, "count": 241 }, "SoccerTwos.Policy.LearningRate.mean": { "value": 0.0003, "min": 0.0003, "max": 0.0003, "count": 241 }, "SoccerTwos.Policy.LearningRate.sum": { "value": 0.0003, "min": 0.0003, "max": 0.0003, "count": 241 }, "SoccerTwos.Policy.Epsilon.mean": { "value": 0.20000000000000007, "min": 0.20000000000000004, "max": 0.20000000000000007, "count": 241 }, "SoccerTwos.Policy.Epsilon.sum": { "value": 0.20000000000000007, "min": 0.20000000000000004, "max": 0.20000000000000007, "count": 241 }, "SoccerTwos.Policy.Beta.mean": { "value": 0.005000000000000001, "min": 0.005000000000000001, "max": 0.005000000000000001, "count": 241 }, "SoccerTwos.Policy.Beta.sum": { "value": 0.005000000000000001, "min": 0.005000000000000001, "max": 0.005000000000000001, "count": 241 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1687784021", "python_version": "3.9.16 (main, May 17 2023, 17:49:16) [MSC v.1916 64 bit (AMD64)]", "command_line_arguments": "C:\\Users\\HP\\anaconda3\\envs\\rl\\Scripts\\mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos --no-graphics --force", "mlagents_version": "0.31.0.dev0", "mlagents_envs_version": "0.31.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "2.0.1+cpu", "numpy_version": "1.21.2", "end_time_seconds": "1687814403" }, "total": 30379.0671534, "count": 1, "self": 3.225056199997198, "children": { "run_training.setup": { "total": 0.4295460000000002, "count": 1, "self": 0.4295460000000002 }, "TrainerController.start_learning": { "total": 30375.412551200003, "count": 1, "self": 13.868539799113933, "children": { "TrainerController._reset_env": { "total": 83.5566681999994, "count": 25, "self": 83.5566681999994 }, "TrainerController.advance": { "total": 30277.367302100887, "count": 346113, "self": 15.163051399264077, "children": { "env_step": { "total": 10664.192402000728, "count": 346113, "self": 8449.588225302014, "children": { "SubprocessEnvManager._take_step": { "total": 2206.184901599864, "count": 346113, "self": 84.61793239926374, "children": { "TorchPolicy.evaluate": { "total": 2121.5669692006004, "count": 630058, "self": 2121.5669692006004 } } }, "workers": { "total": 8.419275098851003, "count": 346113, "self": 0.0, "children": { "worker_root": { "total": 30271.26001469957, "count": 346113, "is_parallel": true, "self": 23406.947119200326, "children": { "steps_from_proto": { "total": 0.08018039999564053, "count": 50, "is_parallel": true, "self": 0.01708030000916949, "children": { "_process_rank_one_or_two_observation": { "total": 0.06310009998647104, "count": 200, "is_parallel": true, "self": 0.06310009998647104 } } }, "UnityEnvironment.step": { "total": 6864.232715099248, "count": 346113, "is_parallel": true, "self": 377.00263039839865, "children": { "UnityEnvironment._generate_step_input": { "total": 362.9385453004808, "count": 346113, "is_parallel": true, "self": 362.9385453004808 }, "communicator.exchange": { "total": 4899.581217100371, "count": 346113, "is_parallel": true, "self": 4899.581217100371 }, "steps_from_proto": { "total": 1224.7103222999979, "count": 692226, "is_parallel": true, "self": 249.2090652003617, "children": { "_process_rank_one_or_two_observation": { "total": 975.5012570996362, "count": 2768904, "is_parallel": true, "self": 975.5012570996362 } } } } } } } } } } }, "trainer_advance": { "total": 19598.011848700895, "count": 346113, "self": 89.78092410198224, "children": { "process_trajectory": { "total": 3282.7165348989065, "count": 346113, "self": 3279.5535615989047, "children": { "RLTrainer._checkpoint": { "total": 3.162973300001795, "count": 10, "self": 3.162973300001795 } } }, "_update_policy": { "total": 16225.514389700005, "count": 241, "self": 1395.569181400042, "children": { "TorchPOCAOptimizer.update": { "total": 14829.945208299963, "count": 7239, "self": 14829.945208299963 } } } } } } }, "trainer_threads": { "total": 1.2000018614344299e-06, "count": 1, "self": 1.2000018614344299e-06 }, "TrainerController._save_models": { "total": 0.6200399000008474, "count": 1, "self": 0.3289555000010296, "children": { "RLTrainer._checkpoint": { "total": 0.29108439999981783, "count": 1, "self": 0.29108439999981783 } } } } } } }