|
{ |
|
"name": "root", |
|
"gauges": { |
|
"SoccerTwos.Policy.Entropy.mean": { |
|
"value": 3.1573421955108643, |
|
"min": 3.1193549633026123, |
|
"max": 3.2956697940826416, |
|
"count": 204 |
|
}, |
|
"SoccerTwos.Policy.Entropy.sum": { |
|
"value": 91537.6640625, |
|
"min": 22145.384765625, |
|
"max": 113804.59375, |
|
"count": 204 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.mean": { |
|
"value": 740.2857142857143, |
|
"min": 471.5, |
|
"max": 999.0, |
|
"count": 204 |
|
}, |
|
"SoccerTwos.Environment.EpisodeLength.sum": { |
|
"value": 20728.0, |
|
"min": 13260.0, |
|
"max": 28076.0, |
|
"count": 204 |
|
}, |
|
"SoccerTwos.Self-play.ELO.mean": { |
|
"value": 1196.044530811736, |
|
"min": 1194.5995997367977, |
|
"max": 1215.4939278097893, |
|
"count": 159 |
|
}, |
|
"SoccerTwos.Self-play.ELO.sum": { |
|
"value": 9568.356246493888, |
|
"min": 2389.1991994735954, |
|
"max": 14396.330814613222, |
|
"count": 159 |
|
}, |
|
"SoccerTwos.Step.mean": { |
|
"value": 2039646.0, |
|
"min": 9054.0, |
|
"max": 2039646.0, |
|
"count": 204 |
|
}, |
|
"SoccerTwos.Step.sum": { |
|
"value": 2039646.0, |
|
"min": 9054.0, |
|
"max": 2039646.0, |
|
"count": 204 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": { |
|
"value": 0.013888576999306679, |
|
"min": -0.013252537697553635, |
|
"max": 0.05611197650432587, |
|
"count": 204 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": { |
|
"value": 0.1944400817155838, |
|
"min": -0.2175348848104477, |
|
"max": 0.8977916240692139, |
|
"count": 204 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": { |
|
"value": 0.014462905004620552, |
|
"min": -0.012911916710436344, |
|
"max": 0.056133802980184555, |
|
"count": 204 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": { |
|
"value": 0.20248067378997803, |
|
"min": -0.21378286182880402, |
|
"max": 0.8981384038925171, |
|
"count": 204 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.mean": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 204 |
|
}, |
|
"SoccerTwos.Environment.CumulativeReward.sum": { |
|
"value": 0.0, |
|
"min": 0.0, |
|
"max": 0.0, |
|
"count": 204 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.mean": { |
|
"value": 0.019714287349155972, |
|
"min": -0.5625, |
|
"max": 0.34826666514078775, |
|
"count": 204 |
|
}, |
|
"SoccerTwos.Policy.ExtrinsicReward.sum": { |
|
"value": 0.2760000228881836, |
|
"min": -9.0, |
|
"max": 5.359999984502792, |
|
"count": 204 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.mean": { |
|
"value": 0.019714287349155972, |
|
"min": -0.5625, |
|
"max": 0.34826666514078775, |
|
"count": 204 |
|
}, |
|
"SoccerTwos.Environment.GroupCumulativeReward.sum": { |
|
"value": 0.2760000228881836, |
|
"min": -9.0, |
|
"max": 5.359999984502792, |
|
"count": 204 |
|
}, |
|
"SoccerTwos.IsTraining.mean": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 204 |
|
}, |
|
"SoccerTwos.IsTraining.sum": { |
|
"value": 1.0, |
|
"min": 1.0, |
|
"max": 1.0, |
|
"count": 204 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.mean": { |
|
"value": 0.016578856820706277, |
|
"min": 0.0104911725250228, |
|
"max": 0.023848259889443096, |
|
"count": 95 |
|
}, |
|
"SoccerTwos.Losses.PolicyLoss.sum": { |
|
"value": 0.016578856820706277, |
|
"min": 0.0104911725250228, |
|
"max": 0.023848259889443096, |
|
"count": 95 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.mean": { |
|
"value": 0.004163745751914878, |
|
"min": 2.5253433932448386e-06, |
|
"max": 0.0048438915982842445, |
|
"count": 95 |
|
}, |
|
"SoccerTwos.Losses.ValueLoss.sum": { |
|
"value": 0.004163745751914878, |
|
"min": 2.5253433932448386e-06, |
|
"max": 0.0048438915982842445, |
|
"count": 95 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.mean": { |
|
"value": 0.004275392834097147, |
|
"min": 2.5751679269584807e-06, |
|
"max": 0.004879755914832155, |
|
"count": 95 |
|
}, |
|
"SoccerTwos.Losses.BaselineLoss.sum": { |
|
"value": 0.004275392834097147, |
|
"min": 2.5751679269584807e-06, |
|
"max": 0.004879755914832155, |
|
"count": 95 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.mean": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 95 |
|
}, |
|
"SoccerTwos.Policy.LearningRate.sum": { |
|
"value": 0.0003, |
|
"min": 0.0003, |
|
"max": 0.0003, |
|
"count": 95 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.mean": { |
|
"value": 0.20000000000000007, |
|
"min": 0.20000000000000007, |
|
"max": 0.20000000000000007, |
|
"count": 95 |
|
}, |
|
"SoccerTwos.Policy.Epsilon.sum": { |
|
"value": 0.20000000000000007, |
|
"min": 0.20000000000000007, |
|
"max": 0.20000000000000007, |
|
"count": 95 |
|
}, |
|
"SoccerTwos.Policy.Beta.mean": { |
|
"value": 0.005000000000000001, |
|
"min": 0.005000000000000001, |
|
"max": 0.005000000000000001, |
|
"count": 95 |
|
}, |
|
"SoccerTwos.Policy.Beta.sum": { |
|
"value": 0.005000000000000001, |
|
"min": 0.005000000000000001, |
|
"max": 0.005000000000000001, |
|
"count": 95 |
|
} |
|
}, |
|
"metadata": { |
|
"timer_format_version": "0.1.0", |
|
"start_time_seconds": "1678549238", |
|
"python_version": "3.9.16 (main, Mar 8 2023, 14:00:05) \n[GCC 11.2.0]", |
|
"command_line_arguments": "/home/fer/miniconda3/envs/rl/bin/mlagents-learn ./SoccerTwos.yaml --env=./SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force", |
|
"mlagents_version": "0.31.0.dev0", |
|
"mlagents_envs_version": "0.31.0.dev0", |
|
"communication_protocol_version": "1.5.0", |
|
"pytorch_version": "1.11.0+cu113", |
|
"numpy_version": "1.21.2", |
|
"end_time_seconds": "1678551788" |
|
}, |
|
"total": 2549.631119179001, |
|
"count": 1, |
|
"self": 0.052769633000934846, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.007245131999297882, |
|
"count": 1, |
|
"self": 0.007245131999297882 |
|
}, |
|
"TrainerController.start_learning": { |
|
"total": 2549.5711044140007, |
|
"count": 1, |
|
"self": 2.7172993279000366, |
|
"children": { |
|
"TrainerController._reset_env": { |
|
"total": 4.349112961001083, |
|
"count": 11, |
|
"self": 4.349112961001083 |
|
}, |
|
"TrainerController.advance": { |
|
"total": 2542.3395385041003, |
|
"count": 133268, |
|
"self": 3.1790522586106817, |
|
"children": { |
|
"env_step": { |
|
"total": 1984.838998668829, |
|
"count": 133268, |
|
"self": 1421.5724086424852, |
|
"children": { |
|
"SubprocessEnvManager._take_step": { |
|
"total": 561.4521566224412, |
|
"count": 133268, |
|
"self": 15.476844517868813, |
|
"children": { |
|
"TorchPolicy.evaluate": { |
|
"total": 545.9753121045724, |
|
"count": 264599, |
|
"self": 545.9753121045724 |
|
} |
|
} |
|
}, |
|
"workers": { |
|
"total": 1.8144334039025125, |
|
"count": 133267, |
|
"self": 0.0, |
|
"children": { |
|
"worker_root": { |
|
"total": 2545.490670408546, |
|
"count": 133267, |
|
"is_parallel": true, |
|
"self": 1425.9446901018728, |
|
"children": { |
|
"run_training.setup": { |
|
"total": 0.0, |
|
"count": 0, |
|
"is_parallel": true, |
|
"self": 0.0, |
|
"children": { |
|
"steps_from_proto": { |
|
"total": 0.001545119999718736, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.0004526110005826922, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.0010925089991360437, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.0010925089991360437 |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 0.019817124000837794, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.0004965509997418849, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 0.00046378200022445526, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.00046378200022445526 |
|
}, |
|
"communicator.exchange": { |
|
"total": 0.01740983200033952, |
|
"count": 1, |
|
"is_parallel": true, |
|
"self": 0.01740983200033952 |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.0014469590005319333, |
|
"count": 2, |
|
"is_parallel": true, |
|
"self": 0.0002938880024885293, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.001153070998043404, |
|
"count": 8, |
|
"is_parallel": true, |
|
"self": 0.001153070998043404 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"UnityEnvironment.step": { |
|
"total": 1119.531721983678, |
|
"count": 133266, |
|
"is_parallel": true, |
|
"self": 68.2219598996544, |
|
"children": { |
|
"UnityEnvironment._generate_step_input": { |
|
"total": 47.15250782205294, |
|
"count": 133266, |
|
"is_parallel": true, |
|
"self": 47.15250782205294 |
|
}, |
|
"communicator.exchange": { |
|
"total": 810.4720720318765, |
|
"count": 133266, |
|
"is_parallel": true, |
|
"self": 810.4720720318765 |
|
}, |
|
"steps_from_proto": { |
|
"total": 193.68518223009414, |
|
"count": 266532, |
|
"is_parallel": true, |
|
"self": 37.63077084696488, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 156.05441138312926, |
|
"count": 1066128, |
|
"is_parallel": true, |
|
"self": 156.05441138312926 |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"steps_from_proto": { |
|
"total": 0.014258322995374328, |
|
"count": 20, |
|
"is_parallel": true, |
|
"self": 0.0028566979963216, |
|
"children": { |
|
"_process_rank_one_or_two_observation": { |
|
"total": 0.011401624999052729, |
|
"count": 80, |
|
"is_parallel": true, |
|
"self": 0.011401624999052729 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_advance": { |
|
"total": 554.3214875766607, |
|
"count": 133267, |
|
"self": 24.025186708360707, |
|
"children": { |
|
"process_trajectory": { |
|
"total": 149.61244848931165, |
|
"count": 133267, |
|
"self": 148.90445992631066, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.7079885630009812, |
|
"count": 4, |
|
"self": 0.7079885630009812 |
|
} |
|
} |
|
}, |
|
"_update_policy": { |
|
"total": 380.6838523789884, |
|
"count": 95, |
|
"self": 218.16326152800502, |
|
"children": { |
|
"TorchPOCAOptimizer.update": { |
|
"total": 162.52059085098335, |
|
"count": 2850, |
|
"self": 162.52059085098335 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}, |
|
"trainer_threads": { |
|
"total": 8.319984772242606e-07, |
|
"count": 1, |
|
"self": 8.319984772242606e-07 |
|
}, |
|
"TrainerController._save_models": { |
|
"total": 0.16515278900078556, |
|
"count": 1, |
|
"self": 0.0012243510009284364, |
|
"children": { |
|
"RLTrainer._checkpoint": { |
|
"total": 0.16392843799985712, |
|
"count": 1, |
|
"self": 0.16392843799985712 |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |