poca-SoccerTwos / run_logs /timers.json
Fer14's picture
First Push
985ec4f
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 3.1573421955108643,
"min": 3.1193549633026123,
"max": 3.2956697940826416,
"count": 204
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 91537.6640625,
"min": 22145.384765625,
"max": 113804.59375,
"count": 204
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 740.2857142857143,
"min": 471.5,
"max": 999.0,
"count": 204
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 20728.0,
"min": 13260.0,
"max": 28076.0,
"count": 204
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1196.044530811736,
"min": 1194.5995997367977,
"max": 1215.4939278097893,
"count": 159
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 9568.356246493888,
"min": 2389.1991994735954,
"max": 14396.330814613222,
"count": 159
},
"SoccerTwos.Step.mean": {
"value": 2039646.0,
"min": 9054.0,
"max": 2039646.0,
"count": 204
},
"SoccerTwos.Step.sum": {
"value": 2039646.0,
"min": 9054.0,
"max": 2039646.0,
"count": 204
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": 0.013888576999306679,
"min": -0.013252537697553635,
"max": 0.05611197650432587,
"count": 204
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": 0.1944400817155838,
"min": -0.2175348848104477,
"max": 0.8977916240692139,
"count": 204
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.014462905004620552,
"min": -0.012911916710436344,
"max": 0.056133802980184555,
"count": 204
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": 0.20248067378997803,
"min": -0.21378286182880402,
"max": 0.8981384038925171,
"count": 204
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 204
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 204
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": 0.019714287349155972,
"min": -0.5625,
"max": 0.34826666514078775,
"count": 204
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": 0.2760000228881836,
"min": -9.0,
"max": 5.359999984502792,
"count": 204
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": 0.019714287349155972,
"min": -0.5625,
"max": 0.34826666514078775,
"count": 204
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": 0.2760000228881836,
"min": -9.0,
"max": 5.359999984502792,
"count": 204
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 204
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 204
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.016578856820706277,
"min": 0.0104911725250228,
"max": 0.023848259889443096,
"count": 95
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.016578856820706277,
"min": 0.0104911725250228,
"max": 0.023848259889443096,
"count": 95
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.004163745751914878,
"min": 2.5253433932448386e-06,
"max": 0.0048438915982842445,
"count": 95
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.004163745751914878,
"min": 2.5253433932448386e-06,
"max": 0.0048438915982842445,
"count": 95
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.004275392834097147,
"min": 2.5751679269584807e-06,
"max": 0.004879755914832155,
"count": 95
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.004275392834097147,
"min": 2.5751679269584807e-06,
"max": 0.004879755914832155,
"count": 95
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 95
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 95
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 95
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 95
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 95
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 95
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1678549238",
"python_version": "3.9.16 (main, Mar 8 2023, 14:00:05) \n[GCC 11.2.0]",
"command_line_arguments": "/home/fer/miniconda3/envs/rl/bin/mlagents-learn ./SoccerTwos.yaml --env=./SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.11.0+cu113",
"numpy_version": "1.21.2",
"end_time_seconds": "1678551788"
},
"total": 2549.631119179001,
"count": 1,
"self": 0.052769633000934846,
"children": {
"run_training.setup": {
"total": 0.007245131999297882,
"count": 1,
"self": 0.007245131999297882
},
"TrainerController.start_learning": {
"total": 2549.5711044140007,
"count": 1,
"self": 2.7172993279000366,
"children": {
"TrainerController._reset_env": {
"total": 4.349112961001083,
"count": 11,
"self": 4.349112961001083
},
"TrainerController.advance": {
"total": 2542.3395385041003,
"count": 133268,
"self": 3.1790522586106817,
"children": {
"env_step": {
"total": 1984.838998668829,
"count": 133268,
"self": 1421.5724086424852,
"children": {
"SubprocessEnvManager._take_step": {
"total": 561.4521566224412,
"count": 133268,
"self": 15.476844517868813,
"children": {
"TorchPolicy.evaluate": {
"total": 545.9753121045724,
"count": 264599,
"self": 545.9753121045724
}
}
},
"workers": {
"total": 1.8144334039025125,
"count": 133267,
"self": 0.0,
"children": {
"worker_root": {
"total": 2545.490670408546,
"count": 133267,
"is_parallel": true,
"self": 1425.9446901018728,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.001545119999718736,
"count": 2,
"is_parallel": true,
"self": 0.0004526110005826922,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0010925089991360437,
"count": 8,
"is_parallel": true,
"self": 0.0010925089991360437
}
}
},
"UnityEnvironment.step": {
"total": 0.019817124000837794,
"count": 1,
"is_parallel": true,
"self": 0.0004965509997418849,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.00046378200022445526,
"count": 1,
"is_parallel": true,
"self": 0.00046378200022445526
},
"communicator.exchange": {
"total": 0.01740983200033952,
"count": 1,
"is_parallel": true,
"self": 0.01740983200033952
},
"steps_from_proto": {
"total": 0.0014469590005319333,
"count": 2,
"is_parallel": true,
"self": 0.0002938880024885293,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.001153070998043404,
"count": 8,
"is_parallel": true,
"self": 0.001153070998043404
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 1119.531721983678,
"count": 133266,
"is_parallel": true,
"self": 68.2219598996544,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 47.15250782205294,
"count": 133266,
"is_parallel": true,
"self": 47.15250782205294
},
"communicator.exchange": {
"total": 810.4720720318765,
"count": 133266,
"is_parallel": true,
"self": 810.4720720318765
},
"steps_from_proto": {
"total": 193.68518223009414,
"count": 266532,
"is_parallel": true,
"self": 37.63077084696488,
"children": {
"_process_rank_one_or_two_observation": {
"total": 156.05441138312926,
"count": 1066128,
"is_parallel": true,
"self": 156.05441138312926
}
}
}
}
},
"steps_from_proto": {
"total": 0.014258322995374328,
"count": 20,
"is_parallel": true,
"self": 0.0028566979963216,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.011401624999052729,
"count": 80,
"is_parallel": true,
"self": 0.011401624999052729
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 554.3214875766607,
"count": 133267,
"self": 24.025186708360707,
"children": {
"process_trajectory": {
"total": 149.61244848931165,
"count": 133267,
"self": 148.90445992631066,
"children": {
"RLTrainer._checkpoint": {
"total": 0.7079885630009812,
"count": 4,
"self": 0.7079885630009812
}
}
},
"_update_policy": {
"total": 380.6838523789884,
"count": 95,
"self": 218.16326152800502,
"children": {
"TorchPOCAOptimizer.update": {
"total": 162.52059085098335,
"count": 2850,
"self": 162.52059085098335
}
}
}
}
}
}
},
"trainer_threads": {
"total": 8.319984772242606e-07,
"count": 1,
"self": 8.319984772242606e-07
},
"TrainerController._save_models": {
"total": 0.16515278900078556,
"count": 1,
"self": 0.0012243510009284364,
"children": {
"RLTrainer._checkpoint": {
"total": 0.16392843799985712,
"count": 1,
"self": 0.16392843799985712
}
}
}
}
}
}
}