poca-SoccerTwos / run_logs /timers.json
candrews1971's picture
50Million
1d4cb64 verified
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 0.9085261225700378,
"min": 0.900277316570282,
"max": 3.29008150100708,
"count": 3700
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 17501.84765625,
"min": 14925.09375,
"max": 105282.609375,
"count": 3700
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 72.75,
"min": 50.422680412371136,
"max": 999.0,
"count": 3700
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19788.0,
"min": 7992.0,
"max": 31936.0,
"count": 3700
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 3701
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 3701
},
"SoccerTwos.Step.mean": {
"value": 49999990.0,
"min": 13009988.0,
"max": 49999990.0,
"count": 3700
},
"SoccerTwos.Step.sum": {
"value": 49999990.0,
"min": 13009988.0,
"max": 49999990.0,
"count": 3700
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.020666854456067085,
"min": -0.18262770771980286,
"max": 0.3022185266017914,
"count": 3700
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -2.810692310333252,
"min": -23.04550552368164,
"max": 30.200801849365234,
"count": 3700
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.020067332312464714,
"min": -0.18312671780586243,
"max": 0.30087995529174805,
"count": 3700
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -2.7291572093963623,
"min": -22.754257202148438,
"max": 30.499494552612305,
"count": 3700
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 3700
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 3700
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": -0.12077352842863869,
"min": -0.4557133336861928,
"max": 0.5597831369882607,
"count": 3700
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": -16.42519986629486,
"min": -54.68560004234314,
"max": 46.9363996386528,
"count": 3700
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": -0.12077352842863869,
"min": -0.4557133336861928,
"max": 0.5597831369882607,
"count": 3700
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": -16.42519986629486,
"min": -54.68560004234314,
"max": 46.9363996386528,
"count": 3700
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1762.2704252584133,
"min": 1199.9971506578554,
"max": 1807.2337574364283,
"count": 3697
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 239668.7778351442,
"min": 2403.487199768784,
"max": 345797.03797725256,
"count": 3697
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.015397342308036362,
"min": 0.011067466323099021,
"max": 0.03322836385729412,
"count": 1793
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.015397342308036362,
"min": 0.011067466323099021,
"max": 0.03322836385729412,
"count": 1793
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.12179502000411352,
"min": 0.0008780070677554856,
"max": 0.1353025034070015,
"count": 1793
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.12179502000411352,
"min": 0.0008780070677554856,
"max": 0.1353025034070015,
"count": 1793
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.12190080806612968,
"min": 0.0010242766661879917,
"max": 0.13573680569728216,
"count": 1793
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.12190080806612968,
"min": 0.0010242766661879917,
"max": 0.13573680569728216,
"count": 1793
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 7.555998921999384e-08,
"min": 7.555998921999384e-08,
"max": 0.0005176344860522198,
"count": 1793
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 7.555998921999384e-08,
"min": 7.555998921999384e-08,
"max": 0.0005176344860522198,
"count": 1793
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.10001077999999998,
"min": 0.10001077999999998,
"max": 0.17394777999999997,
"count": 1793
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.10001077999999998,
"min": 0.10001077999999998,
"max": 0.17394777999999997,
"count": 1793
},
"SoccerTwos.Policy.Beta.mean": {
"value": 1.053792199999996e-05,
"min": 1.053792199999996e-05,
"max": 0.0036999942220000016,
"count": 1793
},
"SoccerTwos.Policy.Beta.sum": {
"value": 1.053792199999996e-05,
"min": 1.053792199999996e-05,
"max": 0.0036999942220000016,
"count": 1793
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1718202104",
"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
"command_line_arguments": "/home/candrews/anaconda3/envs/rl/bin/mlagents-learn results/SoccerTwos/configuration.yaml --run-id=SoccerTwos --resume",
"mlagents_version": "1.0.0",
"mlagents_envs_version": "1.0.0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.3.1+cu121",
"numpy_version": "1.21.2",
"end_time_seconds": "1718291544"
},
"total": 89439.655143559,
"count": 1,
"self": 0.12202233797870576,
"children": {
"run_training.setup": {
"total": 0.016299434000757174,
"count": 1,
"self": 0.016299434000757174
},
"TrainerController.start_learning": {
"total": 89439.51682178701,
"count": 1,
"self": 48.225265316374134,
"children": {
"TrainerController._reset_env": {
"total": 5.392195741071191,
"count": 186,
"self": 5.392195741071191
},
"TrainerController.advance": {
"total": 89385.65861405357,
"count": 2504281,
"self": 43.67091076684301,
"children": {
"env_step": {
"total": 72551.5218888928,
"count": 2504281,
"self": 48862.6198433862,
"children": {
"SubprocessEnvManager._take_step": {
"total": 23658.219093947908,
"count": 2504281,
"self": 324.338922350933,
"children": {
"TorchPolicy.evaluate": {
"total": 23333.880171596975,
"count": 4648782,
"self": 23333.880171596975
}
}
},
"workers": {
"total": 30.682951558695095,
"count": 2504281,
"self": 0.0,
"children": {
"worker_root": {
"total": 89322.32348160779,
"count": 2504281,
"is_parallel": true,
"self": 45938.6905439756,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.002996798999447492,
"count": 2,
"is_parallel": true,
"self": 0.0012141010010964237,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0017826979983510682,
"count": 8,
"is_parallel": true,
"self": 0.0017826979983510682
}
}
},
"UnityEnvironment.step": {
"total": 0.03301058000033663,
"count": 1,
"is_parallel": true,
"self": 0.0005553990004045772,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.00037568999960058136,
"count": 1,
"is_parallel": true,
"self": 0.00037568999960058136
},
"communicator.exchange": {
"total": 0.030290142000012565,
"count": 1,
"is_parallel": true,
"self": 0.030290142000012565
},
"steps_from_proto": {
"total": 0.0017893490003189072,
"count": 2,
"is_parallel": true,
"self": 0.00037193900061538443,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0014174099997035228,
"count": 8,
"is_parallel": true,
"self": 0.0014174099997035228
}
}
}
}
}
}
},
"steps_from_proto": {
"total": 0.3447280409091036,
"count": 370,
"is_parallel": true,
"self": 0.06514130008235952,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.27958674082674406,
"count": 1480,
"is_parallel": true,
"self": 0.27958674082674406
}
}
},
"UnityEnvironment.step": {
"total": 43383.28820959128,
"count": 2504280,
"is_parallel": true,
"self": 1448.4682002114132,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 932.0408725699708,
"count": 2504280,
"is_parallel": true,
"self": 932.0408725699708
},
"communicator.exchange": {
"total": 36480.94365370879,
"count": 2504280,
"is_parallel": true,
"self": 36480.94365370879
},
"steps_from_proto": {
"total": 4521.83548310111,
"count": 5008560,
"is_parallel": true,
"self": 864.9375246691716,
"children": {
"_process_rank_one_or_two_observation": {
"total": 3656.8979584319386,
"count": 20034240,
"is_parallel": true,
"self": 3656.8979584319386
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 16790.465814393916,
"count": 2504281,
"self": 389.440108310886,
"children": {
"process_trajectory": {
"total": 8186.032770570991,
"count": 2504281,
"self": 8163.696337590989,
"children": {
"RLTrainer._checkpoint": {
"total": 22.33643298000152,
"count": 75,
"self": 22.33643298000152
}
}
},
"_update_policy": {
"total": 8214.99293551204,
"count": 1793,
"self": 5104.453318782099,
"children": {
"TorchPOCAOptimizer.update": {
"total": 3110.5396167299414,
"count": 53796,
"self": 3110.5396167299414
}
}
}
}
}
}
},
"trainer_threads": {
"total": 7.199996616691351e-07,
"count": 1,
"self": 7.199996616691351e-07
},
"TrainerController._save_models": {
"total": 0.24074595600541215,
"count": 1,
"self": 0.0033287870028289035,
"children": {
"RLTrainer._checkpoint": {
"total": 0.23741716900258325,
"count": 1,
"self": 0.23741716900258325
}
}
}
}
}
}
}