poca-SoccerTwos / run_logs /timers.json
emmuzoo's picture
Second Push
01c4fee
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 3.134723663330078,
"min": 3.134723663330078,
"max": 3.295743703842163,
"count": 200
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 69014.078125,
"min": 23137.46484375,
"max": 112792.7890625,
"count": 200
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 670.1428571428571,
"min": 418.1818181818182,
"max": 999.0,
"count": 200
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 18764.0,
"min": 16544.0,
"max": 23560.0,
"count": 200
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1207.5592719658505,
"min": 1190.3462539934706,
"max": 1207.5592719658505,
"count": 165
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 7245.355631795102,
"min": 2381.9796513433785,
"max": 21607.680104602616,
"count": 165
},
"SoccerTwos.Step.mean": {
"value": 1999164.0,
"min": 9140.0,
"max": 1999164.0,
"count": 200
},
"SoccerTwos.Step.sum": {
"value": 1999164.0,
"min": 9140.0,
"max": 1999164.0,
"count": 200
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.013440868817269802,
"min": -0.02255900204181671,
"max": 0.07795070856809616,
"count": 200
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -0.18817216157913208,
"min": -0.3406982421875,
"max": 1.5590142011642456,
"count": 200
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.011447346769273281,
"min": -0.02832871302962303,
"max": 0.07786843925714493,
"count": 200
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -0.1602628529071808,
"min": -0.4602850675582886,
"max": 1.5573687553405762,
"count": 200
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 200
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 200
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": 0.3288285732269287,
"min": -0.6,
"max": 0.375925000756979,
"count": 200
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": 4.603600025177002,
"min": -7.7368000745773315,
"max": 6.014800012111664,
"count": 200
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": 0.3288285732269287,
"min": -0.6,
"max": 0.375925000756979,
"count": 200
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": 4.603600025177002,
"min": -7.7368000745773315,
"max": 6.014800012111664,
"count": 200
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 200
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 200
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.016989466220062848,
"min": 0.011690640903058618,
"max": 0.02217564850967998,
"count": 93
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.016989466220062848,
"min": 0.011690640903058618,
"max": 0.02217564850967998,
"count": 93
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.0025493189576081933,
"min": 2.715861914263466e-06,
"max": 0.01054837116971612,
"count": 93
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.0025493189576081933,
"min": 2.715861914263466e-06,
"max": 0.01054837116971612,
"count": 93
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.002578929966936509,
"min": 2.2835658095724892e-06,
"max": 0.010203083076824744,
"count": 93
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.002578929966936509,
"min": 2.2835658095724892e-06,
"max": 0.010203083076824744,
"count": 93
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 93
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 93
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.2,
"max": 0.20000000000000007,
"count": 93
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.2,
"max": 0.20000000000000007,
"count": 93
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005,
"max": 0.005000000000000001,
"count": 93
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005,
"max": 0.005000000000000001,
"count": 93
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1681562902",
"python_version": "3.9.16 (main, Mar 8 2023, 14:00:05) \n[GCC 11.2.0]",
"command_line_arguments": "/home/aztleclan/training/moocs/huggingfaces/unit7/.conda/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env ./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.11.0+cu102",
"numpy_version": "1.21.2",
"end_time_seconds": "1681566715"
},
"total": 3813.399794515999,
"count": 1,
"self": 0.3209155739987182,
"children": {
"run_training.setup": {
"total": 0.012022582000099646,
"count": 1,
"self": 0.012022582000099646
},
"TrainerController.start_learning": {
"total": 3813.06685636,
"count": 1,
"self": 2.9389210559420462,
"children": {
"TrainerController._reset_env": {
"total": 5.7804522669994185,
"count": 10,
"self": 5.7804522669994185
},
"TrainerController.advance": {
"total": 3804.0603381170595,
"count": 130218,
"self": 3.510101454347023,
"children": {
"env_step": {
"total": 2834.846090115796,
"count": 130218,
"self": 2204.7434627477887,
"children": {
"SubprocessEnvManager._take_step": {
"total": 628.1614574820524,
"count": 130218,
"self": 23.233958940654702,
"children": {
"TorchPolicy.evaluate": {
"total": 604.9274985413977,
"count": 258436,
"self": 604.9274985413977
}
}
},
"workers": {
"total": 1.9411698859548778,
"count": 130218,
"self": 0.0,
"children": {
"worker_root": {
"total": 3807.1614705310885,
"count": 130218,
"is_parallel": true,
"self": 1971.222390435908,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.005138307999914105,
"count": 2,
"is_parallel": true,
"self": 0.001479011000810715,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0036592969991033897,
"count": 8,
"is_parallel": true,
"self": 0.0036592969991033897
}
}
},
"UnityEnvironment.step": {
"total": 0.036166889000014635,
"count": 1,
"is_parallel": true,
"self": 0.001194107000628719,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0007146540001485846,
"count": 1,
"is_parallel": true,
"self": 0.0007146540001485846
},
"communicator.exchange": {
"total": 0.0314693599993916,
"count": 1,
"is_parallel": true,
"self": 0.0314693599993916
},
"steps_from_proto": {
"total": 0.0027887679998457315,
"count": 2,
"is_parallel": true,
"self": 0.0005849069984833477,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.002203861001362384,
"count": 8,
"is_parallel": true,
"self": 0.002203861001362384
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 1835.92103960018,
"count": 130217,
"is_parallel": true,
"self": 109.5906046352602,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 64.5990994740423,
"count": 130217,
"is_parallel": true,
"self": 64.5990994740423
},
"communicator.exchange": {
"total": 1377.2451884587445,
"count": 130217,
"is_parallel": true,
"self": 1377.2451884587445
},
"steps_from_proto": {
"total": 284.486147032133,
"count": 260434,
"is_parallel": true,
"self": 54.12488937899434,
"children": {
"_process_rank_one_or_two_observation": {
"total": 230.36125765313864,
"count": 1041736,
"is_parallel": true,
"self": 230.36125765313864
}
}
}
}
},
"steps_from_proto": {
"total": 0.018040495000605006,
"count": 18,
"is_parallel": true,
"self": 0.0036618320027628215,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.014378662997842184,
"count": 72,
"is_parallel": true,
"self": 0.014378662997842184
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 965.7041465469165,
"count": 130218,
"self": 21.454896582661604,
"children": {
"process_trajectory": {
"total": 194.95743723825217,
"count": 130218,
"self": 193.74353206125124,
"children": {
"RLTrainer._checkpoint": {
"total": 1.2139051770009246,
"count": 4,
"self": 1.2139051770009246
}
}
},
"_update_policy": {
"total": 749.2918127260027,
"count": 93,
"self": 335.0551875339879,
"children": {
"TorchPOCAOptimizer.update": {
"total": 414.2366251920148,
"count": 2796,
"self": 414.2366251920148
}
}
}
}
}
}
},
"trainer_threads": {
"total": 8.160004654200748e-07,
"count": 1,
"self": 8.160004654200748e-07
},
"TrainerController._save_models": {
"total": 0.2871441039987985,
"count": 1,
"self": 0.002259959997900296,
"children": {
"RLTrainer._checkpoint": {
"total": 0.28488414400089823,
"count": 1,
"self": 0.28488414400089823
}
}
}
}
}
}
}