|
{ |
|
"name": "root", |
|
"gauges": { |
|
"SoccerTwos.Policy.Entropy.mean": { |
|
"value": 2.0180764198303223, |
|
"min": 1.9686380624771118, |
|
"max": 3.29573130607605, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Policy.Entropy.sum": { |
|
"value": 40942.734375, |
|
"min": 23230.611328125, |
|
"max": 127156.0390625, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.mean": { |
|
"value": 57.773809523809526, |
|
"min": 46.25471698113208, |
|
"max": 999.0, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.sum": { |
|
"value": 19412.0, |
|
"min": 16304.0, |
|
"max": 24372.0, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Self-play.ELO.mean": { |
|
"value": 1606.7540705210154, |
|
"min": 1194.1876210015298, |
|
"max": 1606.7540705210154, |
|
"count": 483 |
|
}, |
|
"SoccerTwos.Self-play.ELO.sum": { |
|
"value": 269934.68384753057, |
|
"min": 2392.4361146861966, |
|
"max": 320537.73161546723, |
|
"count": 483 |
|
}, |
|
"SoccerTwos.Step.mean": { |
|
"value": 4999988.0, |
|
"min": 9206.0, |
|
"max": 4999988.0, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Step.sum": { |
|
"value": 4999988.0, |
|
"min": 9206.0, |
|
"max": 4999988.0, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
|
"value": 0.08221761882305145, |
|
"min": -0.16408230364322662, |
|
"max": 0.22671149671077728, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
|
"value": 13.812560081481934, |
|
"min": -29.04256820678711, |
|
"max": 28.614913940429688, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.081489697098732, |
|
"min": -0.16812725365161896, |
|
"max": 0.22300933301448822, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 13.690268516540527, |
|
"min": -29.75852394104004, |
|
"max": 29.2299747467041, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.mean": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.sum": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.mean": { |
|
"value": 0.17836428469135648, |
|
"min": -0.5160571421895709, |
|
"max": 0.5442823518725003, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.sum": { |
|
"value": 29.965199828147888, |
|
"min": -62.956199645996094, |
|
"max": 55.29199993610382, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.mean": { |
|
"value": 0.17836428469135648, |
|
"min": -0.5160571421895709, |
|
"max": 0.5442823518725003, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.sum": { |
|
"value": 29.965199828147888, |
|
"min": -62.956199645996094, |
|
"max": 55.29199993610382, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 500 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.mean": { |
|
"value": 0.018076893081888555, |
|
"min": 0.011601724340289365, |
|
"max": 0.02478181136199661, |
|
"count": 238 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.sum": { |
|
"value": 0.018076893081888555, |
|
"min": 0.011601724340289365, |
|
"max": 0.02478181136199661, |
|
"count": 238 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.mean": { |
|
"value": 0.09370621119936308, |
|
"min": 9.677321001314946e-06, |
|
"max": 0.10801337112983068, |
|
"count": 238 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.sum": { |
|
"value": 0.09370621119936308, |
|
"min": 9.677321001314946e-06, |
|
"max": 0.10801337112983068, |
|
"count": 238 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.mean": { |
|
"value": 0.09552678316831589, |
|
"min": 9.16501976462314e-06, |
|
"max": 0.11014168585340182, |
|
"count": 238 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.sum": { |
|
"value": 0.09552678316831589, |
|
"min": 9.16501976462314e-06, |
|
"max": 0.11014168585340182, |
|
"count": 238 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.mean": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 238 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.sum": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 238 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.mean": { |
|
"value": 0.20000000000000007, |
|
"min": 0.20000000000000007, |
|
"max": 0.20000000000000007, |
|
"count": 238 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.sum": { |
|
"value": 0.20000000000000007, |
|
"min": 0.20000000000000007, |
|
"max": 0.20000000000000007, |
|
"count": 238 |
|
}, |
|
"SoccerTwos.Policy.Beta.mean": { |
|
"value": 0.005000000000000001, |
|
"min": 0.005000000000000001, |
|
"max": 0.005000000000000001, |
|
"count": 238 |
|
}, |
|
"SoccerTwos.Policy.Beta.sum": { |
|
"value": 0.005000000000000001, |
|
"min": 0.005000000000000001, |
|
"max": 0.005000000000000001, |
|
"count": 238 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1726140025", |
|
"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]", |
|
"command_line_arguments": "/home/ron/anaconda3/envs/rl/bin/mlagents-learn SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force", |
|
"mlagents_version": "1.1.0.dev0", |
|
"mlagents_envs_version": "1.1.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "2.4.1+cu121", |
|
"numpy_version": "1.23.5", |
|
"end_time_seconds": "1726143333" |
|
}, |
|
"total": 3307.778840974999, |
|
"count": 1, |
|
"self": 0.16651327399449656, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.017641124002693687, |
|
"count": 1, |
|
"self": 0.017641124002693687 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 3307.594686577002, |
|
"count": 1, |
|
"self": 2.944197011049255, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 1.430085665993829, |
|
"count": 25, |
|
"self": 1.430085665993829 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 3303.1576436479554, |
|
"count": 335444, |
|
"self": 2.829188156807504, |
|
"children": { |
|
"env_step": { |
|
"total": 2603.5166298651347, |
|
"count": 335444, |
|
"self": 1883.2772055045607, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 718.1913456719631, |
|
"count": 335444, |
|
"self": 21.45619433902175, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 696.7351513329413, |
|
"count": 635164, |
|
"self": 696.7351513329413 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 2.0480786886109854, |
|
"count": 335444, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 3303.6074121928505, |
|
"count": 335444, |
|
"is_parallel": true, |
|
"self": 1771.8287012314358, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.0010473849979462102, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.00022717300089425407, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0008202119970519561, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0008202119970519561 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.011166587999468902, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00024985900017782114, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.00019514900122885592, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00019514900122885592 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.010036065999884158, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.010036065999884158 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0006855139981780667, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.0001331999992544297, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.000552313998923637, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.000552313998923637 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 1531.7615807343973, |
|
"count": 335443, |
|
"is_parallel": true, |
|
"self": 89.4693392949739, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 52.059525609489356, |
|
"count": 335443, |
|
"is_parallel": true, |
|
"self": 52.059525609489356 |
|
}, |
|
"communicator.exchange": { |
|
"total": 1156.2756498972412, |
|
"count": 335443, |
|
"is_parallel": true, |
|
"self": 1156.2756498972412 |
|
}, |
|
"steps_from_proto": { |
|
"total": 233.95706593269279, |
|
"count": 670886, |
|
"is_parallel": true, |
|
"self": 43.36958953709109, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 190.5874763956017, |
|
"count": 2683544, |
|
"is_parallel": true, |
|
"self": 190.5874763956017 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0171302270173328, |
|
"count": 48, |
|
"is_parallel": true, |
|
"self": 0.003224001011403743, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.013906226005929057, |
|
"count": 192, |
|
"is_parallel": true, |
|
"self": 0.013906226005929057 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 696.8118256260132, |
|
"count": 335444, |
|
"self": 23.83871245248156, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 295.05417500857584, |
|
"count": 335444, |
|
"self": 294.34056990057434, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.7136051080015022, |
|
"count": 10, |
|
"self": 0.7136051080015022 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 377.91893816495576, |
|
"count": 238, |
|
"self": 246.29837315572877, |
|
"children": { |
|
"TorchPOCAOptimizer.update": { |
|
"total": 131.620565009227, |
|
"count": 7140, |
|
"self": 131.620565009227 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 4.3200270738452673e-07, |
|
"count": 1, |
|
"self": 4.3200270738452673e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.06275982000079239, |
|
"count": 1, |
|
"self": 0.0005887779989279807, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.06217104200186441, |
|
"count": 1, |
|
"self": 0.06217104200186441 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |