poca-SoccerTwos / run_logs /timers.json
saxelsso's picture
Second Push
dc68905 verified
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 1.671779990196228,
"min": 1.483157753944397,
"max": 3.29573392868042,
"count": 2172
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 33328.60546875,
"min": 21977.736328125,
"max": 113948.734375,
"count": 2172
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 60.44578313253012,
"min": 40.98360655737705,
"max": 999.0,
"count": 2172
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 20068.0,
"min": 7992.0,
"max": 30456.0,
"count": 2172
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1539.0438597037996,
"min": 1201.7416295213911,
"max": 1632.7729248992605,
"count": 2169
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 255481.28071083073,
"min": 2407.9198778528084,
"max": 393499.67341582046,
"count": 2169
},
"SoccerTwos.Step.mean": {
"value": 21719990.0,
"min": 9976.0,
"max": 21719990.0,
"count": 2172
},
"SoccerTwos.Step.sum": {
"value": 21719990.0,
"min": 9976.0,
"max": 21719990.0,
"count": 2172
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.0039015451911836863,
"min": -0.16042177379131317,
"max": 0.18803301453590393,
"count": 2172
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -0.6437549591064453,
"min": -29.35718536376953,
"max": 25.85744285583496,
"count": 2172
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.0019325704779475927,
"min": -0.16366998851299286,
"max": 0.18803183734416962,
"count": 2172
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -0.3188741207122803,
"min": -29.809600830078125,
"max": 24.820201873779297,
"count": 2172
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 2172
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 2172
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": 0.049229092308969206,
"min": -0.615013333161672,
"max": 0.49932221902741325,
"count": 2172
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": 8.12280023097992,
"min": -58.684799790382385,
"max": 63.74240005016327,
"count": 2172
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": 0.049229092308969206,
"min": -0.615013333161672,
"max": 0.49932221902741325,
"count": 2172
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": 8.12280023097992,
"min": -58.684799790382385,
"max": 63.74240005016327,
"count": 2172
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 2172
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 2172
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.013729617009327436,
"min": 0.010989157442721383,
"max": 0.025509973475709557,
"count": 1052
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.013729617009327436,
"min": 0.010989157442721383,
"max": 0.025509973475709557,
"count": 1052
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.1058132159213225,
"min": 0.0009146183729171753,
"max": 0.1211084894835949,
"count": 1052
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.1058132159213225,
"min": 0.0009146183729171753,
"max": 0.1211084894835949,
"count": 1052
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.10755141600966453,
"min": 0.0009252421053436896,
"max": 0.12316837261120478,
"count": 1052
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.10755141600966453,
"min": 0.0009252421053436896,
"max": 0.12316837261120478,
"count": 1052
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 1052
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 0.0003,
"min": 0.0003,
"max": 0.0003,
"count": 1052
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.20000000000000004,
"max": 0.20000000000000007,
"count": 1052
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.20000000000000004,
"max": 0.20000000000000007,
"count": 1052
},
"SoccerTwos.Policy.Beta.mean": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 1052
},
"SoccerTwos.Policy.Beta.sum": {
"value": 0.005000000000000001,
"min": 0.005000000000000001,
"max": 0.005000000000000001,
"count": 1052
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1736415869",
"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
"command_line_arguments": "/home/stefan/miniconda3/envs/ml-agents/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos --run-id=SoccerTwos2 --no-graphics --torch-device cuda",
"mlagents_version": "1.2.0.dev0",
"mlagents_envs_version": "1.2.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.5.1+cu124",
"numpy_version": "1.23.5",
"end_time_seconds": "1736451844"
},
"total": 35974.67269840401,
"count": 1,
"self": 0.40740082100819563,
"children": {
"run_training.setup": {
"total": 0.010543634001805913,
"count": 1,
"self": 0.010543634001805913
},
"TrainerController.start_learning": {
"total": 35974.254753949,
"count": 1,
"self": 20.7283982641311,
"children": {
"TrainerController._reset_env": {
"total": 2.7039670909798588,
"count": 109,
"self": 2.7039670909798588
},
"TrainerController.advance": {
"total": 35950.661532302875,
"count": 1498144,
"self": 19.332999862155702,
"children": {
"env_step": {
"total": 27302.5172698968,
"count": 1498144,
"self": 16589.43508921757,
"children": {
"SubprocessEnvManager._take_step": {
"total": 10700.206373095512,
"count": 1498144,
"self": 123.36394279388333,
"children": {
"TorchPolicy.evaluate": {
"total": 10576.842430301629,
"count": 2730560,
"self": 10576.842430301629
}
}
},
"workers": {
"total": 12.875807583717688,
"count": 1498143,
"self": 0.0,
"children": {
"worker_root": {
"total": 35929.36511270509,
"count": 1498143,
"is_parallel": true,
"self": 21602.363495709753,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0017083109996747226,
"count": 2,
"is_parallel": true,
"self": 0.0005188049835851416,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.001189506016089581,
"count": 8,
"is_parallel": true,
"self": 0.001189506016089581
}
}
},
"UnityEnvironment.step": {
"total": 0.02624909100268269,
"count": 1,
"is_parallel": true,
"self": 0.00038735600537620485,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.00039570599619764835,
"count": 1,
"is_parallel": true,
"self": 0.00039570599619764835
},
"communicator.exchange": {
"total": 0.024261833001219202,
"count": 1,
"is_parallel": true,
"self": 0.024261833001219202
},
"steps_from_proto": {
"total": 0.0012041959998896345,
"count": 2,
"is_parallel": true,
"self": 0.0002781369985314086,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0009260590013582259,
"count": 8,
"is_parallel": true,
"self": 0.0009260590013582259
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 14326.880298964265,
"count": 1498142,
"is_parallel": true,
"self": 481.7784100755889,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 320.9030825123482,
"count": 1498142,
"is_parallel": true,
"self": 320.9030825123482
},
"communicator.exchange": {
"total": 12007.851514953283,
"count": 1498142,
"is_parallel": true,
"self": 12007.851514953283
},
"steps_from_proto": {
"total": 1516.3472914230442,
"count": 2996284,
"is_parallel": true,
"self": 327.8235669827118,
"children": {
"_process_rank_one_or_two_observation": {
"total": 1188.5237244403324,
"count": 11985136,
"is_parallel": true,
"self": 1188.5237244403324
}
}
}
}
},
"steps_from_proto": {
"total": 0.12131803107331507,
"count": 216,
"is_parallel": true,
"self": 0.026903044199571013,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.09441498687374406,
"count": 864,
"is_parallel": true,
"self": 0.09441498687374406
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 8628.811262543917,
"count": 1498143,
"self": 161.23468632528238,
"children": {
"process_trajectory": {
"total": 5099.0348406058765,
"count": 1498143,
"self": 5092.362769061881,
"children": {
"RLTrainer._checkpoint": {
"total": 6.672071543995116,
"count": 43,
"self": 6.672071543995116
}
}
},
"_update_policy": {
"total": 3368.541735612758,
"count": 1052,
"self": 1602.0031282262353,
"children": {
"TorchPOCAOptimizer.update": {
"total": 1766.538607386523,
"count": 31569,
"self": 1766.538607386523
}
}
}
}
}
}
},
"trainer_threads": {
"total": 7.300113793462515e-07,
"count": 1,
"self": 7.300113793462515e-07
},
"TrainerController._save_models": {
"total": 0.16085556100006215,
"count": 1,
"self": 0.001240865996805951,
"children": {
"RLTrainer._checkpoint": {
"total": 0.1596146950032562,
"count": 1,
"self": 0.1596146950032562
}
}
}
}
}
}
}