|
{ |
|
"name": "root", |
|
"gauges": { |
|
"SoccerTwos.Policy.Entropy.mean": { |
|
"value": 1.4070029258728027, |
|
"min": 1.364182472229004, |
|
"max": 3.2957570552825928, |
|
"count": 2251 |
|
}, |
|
"SoccerTwos.Policy.Entropy.sum": { |
|
"value": 27824.890625, |
|
"min": 14507.8642578125, |
|
"max": 105464.2265625, |
|
"count": 2251 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.mean": { |
|
"value": 49.7979797979798, |
|
"min": 40.31147540983606, |
|
"max": 999.0, |
|
"count": 2251 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.sum": { |
|
"value": 19720.0, |
|
"min": 13332.0, |
|
"max": 28468.0, |
|
"count": 2251 |
|
}, |
|
"SoccerTwos.Self-play.ELO.mean": { |
|
"value": 1550.0245450575744, |
|
"min": 1190.0487814065316, |
|
"max": 1641.0483088367112, |
|
"count": 2246 |
|
}, |
|
"SoccerTwos.Self-play.ELO.sum": { |
|
"value": 306904.85992139974, |
|
"min": 2385.9431164520465, |
|
"max": 388701.1363259206, |
|
"count": 2246 |
|
}, |
|
"SoccerTwos.Step.mean": { |
|
"value": 22509878.0, |
|
"min": 9250.0, |
|
"max": 22509878.0, |
|
"count": 2251 |
|
}, |
|
"SoccerTwos.Step.sum": { |
|
"value": 22509878.0, |
|
"min": 9250.0, |
|
"max": 22509878.0, |
|
"count": 2251 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
|
"value": 0.028588376939296722, |
|
"min": -0.14516468346118927, |
|
"max": 0.22160297632217407, |
|
"count": 2251 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
|
"value": 5.66049861907959, |
|
"min": -26.064918518066406, |
|
"max": 33.42010498046875, |
|
"count": 2251 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.02912515588104725, |
|
"min": -0.14482811093330383, |
|
"max": 0.21980521082878113, |
|
"count": 2251 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 5.766780853271484, |
|
"min": -27.210805892944336, |
|
"max": 34.05256652832031, |
|
"count": 2251 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.mean": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 2251 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.sum": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 2251 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.mean": { |
|
"value": 0.1643575755032626, |
|
"min": -0.6405809518127215, |
|
"max": 0.5064571443058196, |
|
"count": 2251 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.sum": { |
|
"value": 32.542799949645996, |
|
"min": -65.78759974241257, |
|
"max": 66.88839983940125, |
|
"count": 2251 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.mean": { |
|
"value": 0.1643575755032626, |
|
"min": -0.6405809518127215, |
|
"max": 0.5064571443058196, |
|
"count": 2251 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.sum": { |
|
"value": 32.542799949645996, |
|
"min": -65.78759974241257, |
|
"max": 66.88839983940125, |
|
"count": 2251 |
|
}, |
|
"SoccerTwos.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 2251 |
|
}, |
|
"SoccerTwos.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 2251 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.mean": { |
|
"value": 0.01851427239695719, |
|
"min": 0.010531172272749245, |
|
"max": 0.02492763645859668, |
|
"count": 1091 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.sum": { |
|
"value": 0.01851427239695719, |
|
"min": 0.010531172272749245, |
|
"max": 0.02492763645859668, |
|
"count": 1091 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.mean": { |
|
"value": 0.10829064498345058, |
|
"min": 0.0010078916025425618, |
|
"max": 0.1292997161547343, |
|
"count": 1091 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.sum": { |
|
"value": 0.10829064498345058, |
|
"min": 0.0010078916025425618, |
|
"max": 0.1292997161547343, |
|
"count": 1091 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.mean": { |
|
"value": 0.11002712522943815, |
|
"min": 0.0010057883948320523, |
|
"max": 0.13142008284727733, |
|
"count": 1091 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.sum": { |
|
"value": 0.11002712522943815, |
|
"min": 0.0010057883948320523, |
|
"max": 0.13142008284727733, |
|
"count": 1091 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.mean": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 1091 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.sum": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 1091 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.mean": { |
|
"value": 0.20000000000000007, |
|
"min": 0.2, |
|
"max": 0.20000000000000007, |
|
"count": 1091 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.sum": { |
|
"value": 0.20000000000000007, |
|
"min": 0.2, |
|
"max": 0.20000000000000007, |
|
"count": 1091 |
|
}, |
|
"SoccerTwos.Policy.Beta.mean": { |
|
"value": 0.005000000000000001, |
|
"min": 0.005, |
|
"max": 0.005000000000000001, |
|
"count": 1091 |
|
}, |
|
"SoccerTwos.Policy.Beta.sum": { |
|
"value": 0.005000000000000001, |
|
"min": 0.005, |
|
"max": 0.005000000000000001, |
|
"count": 1091 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1675332665", |
|
"python_version": "3.8.16 (default, Jan 17 2023, 23:13:24) \n[GCC 11.2.0]", |
|
"command_line_arguments": "/home/antoine/anaconda3/envs/hf_drl_unit7/bin/mlagents-learn ./ml-agents/config/poca/SoccerTwos.yaml --env=./SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos_1 --no-graphics", |
|
"mlagents_version": "0.31.0.dev0", |
|
"mlagents_envs_version": "0.31.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.8.1+cu102", |
|
"numpy_version": "1.21.2", |
|
"end_time_seconds": "1675364819" |
|
}, |
|
"total": 32154.188953462, |
|
"count": 1, |
|
"self": 0.1803494279993174, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.00640905700129224, |
|
"count": 1, |
|
"self": 0.00640905700129224 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 32154.002194976998, |
|
"count": 1, |
|
"self": 22.474659589188377, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 4.29831169298086, |
|
"count": 113, |
|
"self": 4.29831169298086 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 32127.09101790282, |
|
"count": 1562426, |
|
"self": 20.422603639017325, |
|
"children": { |
|
"env_step": { |
|
"total": 24643.542619113483, |
|
"count": 1562426, |
|
"self": 19942.420775126586, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 4686.904853418628, |
|
"count": 1562426, |
|
"self": 111.88414057251794, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 4575.02071284611, |
|
"count": 2828472, |
|
"self": 4575.02071284611 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 14.216990568267647, |
|
"count": 1562425, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 32115.610743571782, |
|
"count": 1562425, |
|
"is_parallel": true, |
|
"self": 14869.433992172224, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.0017130690011981642, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.00035320399911142886, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0013598650020867353, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0013598650020867353 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.020998721000069054, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0009554309981467668, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.0006709480003337376, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0006709480003337376 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.016712819000531454, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.016712819000531454 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.002659523001057096, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.00043291599831718486, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.002226607002739911, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.002226607002739911 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 17245.90504891357, |
|
"count": 1562424, |
|
"is_parallel": true, |
|
"self": 1198.7301085013478, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 786.7526528414492, |
|
"count": 1562424, |
|
"is_parallel": true, |
|
"self": 786.7526528414492 |
|
}, |
|
"communicator.exchange": { |
|
"total": 11804.459724711165, |
|
"count": 1562424, |
|
"is_parallel": true, |
|
"self": 11804.459724711165 |
|
}, |
|
"steps_from_proto": { |
|
"total": 3455.9625628596077, |
|
"count": 3124848, |
|
"is_parallel": true, |
|
"self": 519.3835088980377, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 2936.57905396157, |
|
"count": 12499392, |
|
"is_parallel": true, |
|
"self": 2936.57905396157 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.27170248599031765, |
|
"count": 224, |
|
"is_parallel": true, |
|
"self": 0.03974755697345245, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.2319549290168652, |
|
"count": 896, |
|
"is_parallel": true, |
|
"self": 0.2319549290168652 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 7463.125795150323, |
|
"count": 1562425, |
|
"self": 156.0927741749765, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 3043.756003937433, |
|
"count": 1562425, |
|
"self": 3037.450239336422, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 6.305764601011106, |
|
"count": 45, |
|
"self": 6.305764601011106 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 4263.2770170379135, |
|
"count": 1092, |
|
"self": 2639.284905304594, |
|
"children": { |
|
"TorchPOCAOptimizer.update": { |
|
"total": 1623.9921117333197, |
|
"count": 32763, |
|
"self": 1623.9921117333197 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 6.400005077011883e-07, |
|
"count": 1, |
|
"self": 6.400005077011883e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.1382051520049572, |
|
"count": 1, |
|
"self": 0.0012712670068140142, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.13693388499814318, |
|
"count": 1, |
|
"self": 0.13693388499814318 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |