|
{ |
|
"name": "root", |
|
"gauges": { |
|
"SoccerTwos.Policy.Entropy.mean": { |
|
"value": 0.9085261225700378, |
|
"min": 0.900277316570282, |
|
"max": 3.29008150100708, |
|
"count": 3700 |
|
}, |
|
"SoccerTwos.Policy.Entropy.sum": { |
|
"value": 17501.84765625, |
|
"min": 14925.09375, |
|
"max": 105282.609375, |
|
"count": 3700 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.mean": { |
|
"value": 72.75, |
|
"min": 50.422680412371136, |
|
"max": 999.0, |
|
"count": 3700 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.sum": { |
|
"value": 19788.0, |
|
"min": 7992.0, |
|
"max": 31936.0, |
|
"count": 3700 |
|
}, |
|
"SoccerTwos.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 3701 |
|
}, |
|
"SoccerTwos.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 3701 |
|
}, |
|
"SoccerTwos.Step.mean": { |
|
"value": 49999990.0, |
|
"min": 13009988.0, |
|
"max": 49999990.0, |
|
"count": 3700 |
|
}, |
|
"SoccerTwos.Step.sum": { |
|
"value": 49999990.0, |
|
"min": 13009988.0, |
|
"max": 49999990.0, |
|
"count": 3700 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
|
"value": -0.020666854456067085, |
|
"min": -0.18262770771980286, |
|
"max": 0.3022185266017914, |
|
"count": 3700 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
|
"value": -2.810692310333252, |
|
"min": -23.04550552368164, |
|
"max": 30.200801849365234, |
|
"count": 3700 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": -0.020067332312464714, |
|
"min": -0.18312671780586243, |
|
"max": 0.30087995529174805, |
|
"count": 3700 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": -2.7291572093963623, |
|
"min": -22.754257202148438, |
|
"max": 30.499494552612305, |
|
"count": 3700 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.mean": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 3700 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.sum": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 3700 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.mean": { |
|
"value": -0.12077352842863869, |
|
"min": -0.4557133336861928, |
|
"max": 0.5597831369882607, |
|
"count": 3700 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.sum": { |
|
"value": -16.42519986629486, |
|
"min": -54.68560004234314, |
|
"max": 46.9363996386528, |
|
"count": 3700 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.mean": { |
|
"value": -0.12077352842863869, |
|
"min": -0.4557133336861928, |
|
"max": 0.5597831369882607, |
|
"count": 3700 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.sum": { |
|
"value": -16.42519986629486, |
|
"min": -54.68560004234314, |
|
"max": 46.9363996386528, |
|
"count": 3700 |
|
}, |
|
"SoccerTwos.Self-play.ELO.mean": { |
|
"value": 1762.2704252584133, |
|
"min": 1199.9971506578554, |
|
"max": 1807.2337574364283, |
|
"count": 3697 |
|
}, |
|
"SoccerTwos.Self-play.ELO.sum": { |
|
"value": 239668.7778351442, |
|
"min": 2403.487199768784, |
|
"max": 345797.03797725256, |
|
"count": 3697 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.mean": { |
|
"value": 0.015397342308036362, |
|
"min": 0.011067466323099021, |
|
"max": 0.03322836385729412, |
|
"count": 1793 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.sum": { |
|
"value": 0.015397342308036362, |
|
"min": 0.011067466323099021, |
|
"max": 0.03322836385729412, |
|
"count": 1793 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.mean": { |
|
"value": 0.12179502000411352, |
|
"min": 0.0008780070677554856, |
|
"max": 0.1353025034070015, |
|
"count": 1793 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.sum": { |
|
"value": 0.12179502000411352, |
|
"min": 0.0008780070677554856, |
|
"max": 0.1353025034070015, |
|
"count": 1793 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.mean": { |
|
"value": 0.12190080806612968, |
|
"min": 0.0010242766661879917, |
|
"max": 0.13573680569728216, |
|
"count": 1793 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.sum": { |
|
"value": 0.12190080806612968, |
|
"min": 0.0010242766661879917, |
|
"max": 0.13573680569728216, |
|
"count": 1793 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.mean": { |
|
"value": 7.555998921999384e-08, |
|
"min": 7.555998921999384e-08, |
|
"max": 0.0005176344860522198, |
|
"count": 1793 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.sum": { |
|
"value": 7.555998921999384e-08, |
|
"min": 7.555998921999384e-08, |
|
"max": 0.0005176344860522198, |
|
"count": 1793 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.mean": { |
|
"value": 0.10001077999999998, |
|
"min": 0.10001077999999998, |
|
"max": 0.17394777999999997, |
|
"count": 1793 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.sum": { |
|
"value": 0.10001077999999998, |
|
"min": 0.10001077999999998, |
|
"max": 0.17394777999999997, |
|
"count": 1793 |
|
}, |
|
"SoccerTwos.Policy.Beta.mean": { |
|
"value": 1.053792199999996e-05, |
|
"min": 1.053792199999996e-05, |
|
"max": 0.0036999942220000016, |
|
"count": 1793 |
|
}, |
|
"SoccerTwos.Policy.Beta.sum": { |
|
"value": 1.053792199999996e-05, |
|
"min": 1.053792199999996e-05, |
|
"max": 0.0036999942220000016, |
|
"count": 1793 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1718202104", |
|
"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]", |
|
"command_line_arguments": "/home/candrews/anaconda3/envs/rl/bin/mlagents-learn results/SoccerTwos/configuration.yaml --run-id=SoccerTwos --resume", |
|
"mlagents_version": "1.0.0", |
|
"mlagents_envs_version": "1.0.0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "2.3.1+cu121", |
|
"numpy_version": "1.21.2", |
|
"end_time_seconds": "1718291544" |
|
}, |
|
"total": 89439.655143559, |
|
"count": 1, |
|
"self": 0.12202233797870576, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.016299434000757174, |
|
"count": 1, |
|
"self": 0.016299434000757174 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 89439.51682178701, |
|
"count": 1, |
|
"self": 48.225265316374134, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 5.392195741071191, |
|
"count": 186, |
|
"self": 5.392195741071191 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 89385.65861405357, |
|
"count": 2504281, |
|
"self": 43.67091076684301, |
|
"children": { |
|
"env_step": { |
|
"total": 72551.5218888928, |
|
"count": 2504281, |
|
"self": 48862.6198433862, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 23658.219093947908, |
|
"count": 2504281, |
|
"self": 324.338922350933, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 23333.880171596975, |
|
"count": 4648782, |
|
"self": 23333.880171596975 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 30.682951558695095, |
|
"count": 2504281, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 89322.32348160779, |
|
"count": 2504281, |
|
"is_parallel": true, |
|
"self": 45938.6905439756, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.002996798999447492, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.0012141010010964237, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0017826979983510682, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0017826979983510682 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.03301058000033663, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0005553990004045772, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.00037568999960058136, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00037568999960058136 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.030290142000012565, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.030290142000012565 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0017893490003189072, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.00037193900061538443, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0014174099997035228, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0014174099997035228 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.3447280409091036, |
|
"count": 370, |
|
"is_parallel": true, |
|
"self": 0.06514130008235952, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.27958674082674406, |
|
"count": 1480, |
|
"is_parallel": true, |
|
"self": 0.27958674082674406 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 43383.28820959128, |
|
"count": 2504280, |
|
"is_parallel": true, |
|
"self": 1448.4682002114132, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 932.0408725699708, |
|
"count": 2504280, |
|
"is_parallel": true, |
|
"self": 932.0408725699708 |
|
}, |
|
"communicator.exchange": { |
|
"total": 36480.94365370879, |
|
"count": 2504280, |
|
"is_parallel": true, |
|
"self": 36480.94365370879 |
|
}, |
|
"steps_from_proto": { |
|
"total": 4521.83548310111, |
|
"count": 5008560, |
|
"is_parallel": true, |
|
"self": 864.9375246691716, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 3656.8979584319386, |
|
"count": 20034240, |
|
"is_parallel": true, |
|
"self": 3656.8979584319386 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 16790.465814393916, |
|
"count": 2504281, |
|
"self": 389.440108310886, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 8186.032770570991, |
|
"count": 2504281, |
|
"self": 8163.696337590989, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 22.33643298000152, |
|
"count": 75, |
|
"self": 22.33643298000152 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 8214.99293551204, |
|
"count": 1793, |
|
"self": 5104.453318782099, |
|
"children": { |
|
"TorchPOCAOptimizer.update": { |
|
"total": 3110.5396167299414, |
|
"count": 53796, |
|
"self": 3110.5396167299414 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 7.199996616691351e-07, |
|
"count": 1, |
|
"self": 7.199996616691351e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.24074595600541215, |
|
"count": 1, |
|
"self": 0.0033287870028289035, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.23741716900258325, |
|
"count": 1, |
|
"self": 0.23741716900258325 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |