poca-test4 / run_logs /timers.json
QYHcrossover's picture
First Commit
043e64d
{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 0.866117000579834,
"min": 0.8086401224136353,
"max": 2.135493516921997,
"count": 14989
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 18708.126953125,
"min": 10466.740234375,
"max": 105615.1484375,
"count": 14989
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 66.29166666666667,
"min": 26.98324022346369,
"max": 125.325,
"count": 14989
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19092.0,
"min": 14712.0,
"max": 22936.0,
"count": 14989
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1707.7936415009024,
"min": 1549.168502889312,
"max": 1746.4515803198233,
"count": 14989
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 245922.28437612994,
"min": 120430.73786124286,
"max": 605872.0984318862,
"count": 14989
},
"SoccerTwos.Step.mean": {
"value": 199999964.0,
"min": 50119986.0,
"max": 199999964.0,
"count": 14989
},
"SoccerTwos.Step.sum": {
"value": 199999964.0,
"min": 50119986.0,
"max": 199999964.0,
"count": 14989
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.04558149352669716,
"min": -0.16296879947185516,
"max": 0.10279054194688797,
"count": 14989
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -6.700479507446289,
"min": -33.77891540527344,
"max": 16.427635192871094,
"count": 14989
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.04524017497897148,
"min": -0.16307416558265686,
"max": 0.10262896120548248,
"count": 14989
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -6.65030574798584,
"min": -34.11742401123047,
"max": 16.870479583740234,
"count": 14989
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 14989
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 14989
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": -0.17092517241328753,
"min": -0.47276239211742693,
"max": 0.5691900824712328,
"count": 14989
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": -25.126000344753265,
"min": -87.17599999904633,
"max": 83.58380001783371,
"count": 14989
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": -0.17092517241328753,
"min": -0.47276239211742693,
"max": 0.5691900824712328,
"count": 14989
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": -25.126000344753265,
"min": -87.17599999904633,
"max": 83.58380001783371,
"count": 14989
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 14989
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 14989
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.018238363913648453,
"min": 0.008571711436282688,
"max": 0.026601446373388172,
"count": 7245
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.018238363913648453,
"min": 0.008571711436282688,
"max": 0.026601446373388172,
"count": 7245
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.09880388751626015,
"min": 0.06719134338200092,
"max": 0.15229609956343967,
"count": 7245
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.09880388751626015,
"min": 0.06719134338200092,
"max": 0.15229609956343967,
"count": 7245
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.09918721541762351,
"min": 0.06746410404642424,
"max": 0.15259439150492352,
"count": 7245
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.09918721541762351,
"min": 0.06746410404642424,
"max": 0.15259439150492352,
"count": 7245
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 6.048997025493988e-09,
"min": 6.048997025493988e-09,
"max": 0.0001498667620666315,
"count": 7245
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 6.048997025493988e-09,
"min": 6.048997025493988e-09,
"max": 0.0001498667620666315,
"count": 7245
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 7245
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.20000000000000007,
"min": 0.20000000000000007,
"max": 0.20000000000000007,
"count": 7245
},
"SoccerTwos.Policy.Beta.mean": {
"value": 1.0297152549999698e-05,
"min": 1.0297152549999698e-05,
"max": 0.00749584351315,
"count": 7245
},
"SoccerTwos.Policy.Beta.sum": {
"value": 1.0297152549999698e-05,
"min": 1.0297152549999698e-05,
"max": 0.00749584351315,
"count": 7245
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1681458589",
"python_version": "3.9.16 (main, Mar 8 2023, 14:00:05) \n[GCC 11.2.0]",
"command_line_arguments": "/data/qyh/env/ml-agents/bin/mlagents-learn ./results/configuration.yaml",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.11.0+cu102",
"numpy_version": "1.21.2",
"end_time_seconds": "1681660711"
},
"total": 202121.95327740815,
"count": 1,
"self": 0.7371731949970126,
"children": {
"run_training.setup": {
"total": 0.08580901497043669,
"count": 1,
"self": 0.08580901497043669
},
"TrainerController.start_learning": {
"total": 202121.13029519818,
"count": 1,
"self": 75.58960591861978,
"children": {
"TrainerController._reset_env": {
"total": 239.88585016061552,
"count": 750,
"self": 239.88585016061552
},
"TrainerController.advance": {
"total": 201805.20052092662,
"count": 889082,
"self": 43.436931712087244,
"children": {
"env_step": {
"total": 109403.14526834106,
"count": 889082,
"self": 35718.75220445846,
"children": {
"SubprocessEnvManager._take_step": {
"total": 73588.09211776033,
"count": 11064486,
"self": 1956.4829019042663,
"children": {
"TorchPolicy.evaluate": {
"total": 71631.60921585606,
"count": 20304662,
"self": 71631.60921585606
}
}
},
"workers": {
"total": 96.30094612226821,
"count": 889082,
"self": 0.0,
"children": {
"worker_root": {
"total": 3786373.531351197,
"count": 11061955,
"is_parallel": true,
"self": 3543006.6518733725,
"children": {
"run_training.setup": {
"total": 1.372944239526987,
"count": 16,
"is_parallel": true,
"self": 0.8564431574195623,
"children": {
"steps_from_proto": {
"total": 0.05167464469559491,
"count": 20,
"is_parallel": true,
"self": 0.012508621672168374,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.03916602302342653,
"count": 80,
"is_parallel": true,
"self": 0.03916602302342653
}
}
},
"UnityEnvironment.step": {
"total": 0.46482643741182983,
"count": 10,
"is_parallel": true,
"self": 0.012752049136906862,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.009736666223034263,
"count": 10,
"is_parallel": true,
"self": 0.009736666223034263
},
"communicator.exchange": {
"total": 0.4049945876467973,
"count": 10,
"is_parallel": true,
"self": 0.4049945876467973
},
"steps_from_proto": {
"total": 0.037343134405091405,
"count": 20,
"is_parallel": true,
"self": 0.007720504887402058,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.029622629517689347,
"count": 80,
"is_parallel": true,
"self": 0.029622629517689347
}
}
}
}
}
}
},
"steps_from_proto": {
"total": 63.20921622682363,
"count": 23968,
"is_parallel": true,
"self": 10.96054931380786,
"children": {
"_process_rank_one_or_two_observation": {
"total": 52.24866691301577,
"count": 95872,
"is_parallel": true,
"self": 52.24866691301577
}
}
},
"UnityEnvironment.step": {
"total": 243302.29731735843,
"count": 11061929,
"is_parallel": true,
"self": 16865.871614304837,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 10229.591617493192,
"count": 11061929,
"is_parallel": true,
"self": 10229.591617493192
},
"communicator.exchange": {
"total": 170588.07838961575,
"count": 11061929,
"is_parallel": true,
"self": 170588.07838961575
},
"steps_from_proto": {
"total": 45618.75569594465,
"count": 22123858,
"is_parallel": true,
"self": 8546.25141385477,
"children": {
"_process_rank_one_or_two_observation": {
"total": 37072.50428208988,
"count": 88495432,
"is_parallel": true,
"self": 37072.50428208988
}
}
}
}
},
"TrainerController.start_learning": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"TrainerController._reset_env": {
"total": 765.6606953628361,
"count": 2576,
"is_parallel": true,
"self": 765.6606953628361
},
"TrainerController.advance": {
"total": 553472.6433439851,
"count": 3113472,
"is_parallel": true,
"self": 127.54399403184652,
"children": {
"env_step": {
"total": 312836.9059403762,
"count": 3113472,
"is_parallel": true,
"self": 104029.15610423265,
"children": {
"SubprocessEnvManager._take_step": {
"total": 208505.66601867974,
"count": 37653456,
"is_parallel": true,
"self": 5868.197185412049,
"children": {
"TorchPolicy.evaluate": {
"total": 202637.4688332677,
"count": 69410080,
"is_parallel": true,
"self": 202637.4688332677
}
}
},
"workers": {
"total": 301.0074671693146,
"count": 3113472,
"is_parallel": true,
"self": 0.0,
"children": {
"worker_root": {
"total": 8863163.5911063,
"count": 37643536,
"is_parallel": true,
"self": 8047015.4603802115,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.8267943151295185,
"count": 320,
"is_parallel": true,
"self": 0.20013794675469398,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.6266563683748245,
"count": 1280,
"is_parallel": true,
"self": 0.6266563683748245
}
}
},
"UnityEnvironment.step": {
"total": 7.437222998589277,
"count": 160,
"is_parallel": true,
"self": 0.2040327861905098,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.1557866595685482,
"count": 160,
"is_parallel": true,
"self": 0.1557866595685482
},
"communicator.exchange": {
"total": 6.479913402348757,
"count": 160,
"is_parallel": true,
"self": 6.479913402348757
},
"steps_from_proto": {
"total": 0.5974901504814625,
"count": 320,
"is_parallel": true,
"self": 0.12352807819843292,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.47396207228302956,
"count": 1280,
"is_parallel": true,
"self": 0.47396207228302956
}
}
}
}
}
}
},
"steps_from_proto": {
"total": 189.85917573422194,
"count": 81920,
"is_parallel": true,
"self": 32.98321542516351,
"children": {
"_process_rank_one_or_two_observation": {
"total": 156.87596030905843,
"count": 327680,
"is_parallel": true,
"self": 156.87596030905843
}
}
},
"UnityEnvironment.step": {
"total": 815958.2715503536,
"count": 37643376,
"is_parallel": true,
"self": 50899.1951662004,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 34107.74587376788,
"count": 37643376,
"is_parallel": true,
"self": 34107.74587376788
},
"communicator.exchange": {
"total": 584456.3526424319,
"count": 37643376,
"is_parallel": true,
"self": 584456.3526424319
},
"steps_from_proto": {
"total": 146494.97786795348,
"count": 75286752,
"is_parallel": true,
"self": 28645.180666983128,
"children": {
"_process_rank_one_or_two_observation": {
"total": 117849.79720097035,
"count": 301147008,
"is_parallel": true,
"self": 117849.79720097035
}
}
}
}
}
}
}
}
},
"steps_from_proto": {
"total": 0.13184957904741168,
"count": 32,
"is_parallel": true,
"self": 0.023764571640640497,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.10808500740677118,
"count": 128,
"is_parallel": true,
"self": 0.10808500740677118
}
}
},
"UnityEnvironment.step": {
"total": 0.9445007154718041,
"count": 16,
"is_parallel": true,
"self": 0.08671622956171632,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.033300156239420176,
"count": 16,
"is_parallel": true,
"self": 0.033300156239420176
},
"communicator.exchange": {
"total": 0.6965830507688224,
"count": 16,
"is_parallel": true,
"self": 0.6965830507688224
},
"steps_from_proto": {
"total": 0.12790127890184522,
"count": 32,
"is_parallel": true,
"self": 0.016938731539994478,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.11096254736185074,
"count": 128,
"is_parallel": true,
"self": 0.11096254736185074
}
}
}
}
}
}
},
"trainer_advance": {
"total": 240508.193409577,
"count": 3113472,
"is_parallel": true,
"self": 4416.851860079914,
"children": {
"process_trajectory": {
"total": 98595.71652773768,
"count": 3113472,
"is_parallel": true,
"self": 98254.31838959828,
"children": {
"RLTrainer._checkpoint": {
"total": 341.3981381393969,
"count": 1008,
"is_parallel": true,
"self": 341.3981381393969
}
}
},
"_update_policy": {
"total": 137495.62502175942,
"count": 24656,
"is_parallel": true,
"self": 92660.20954589918,
"children": {
"TorchPOCAOptimizer.update": {
"total": 44835.41547586024,
"count": 739680,
"is_parallel": true,
"self": 44835.41547586024
}
}
}
}
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 92358.61832087347,
"count": 889082,
"self": 1729.3800815341529,
"children": {
"process_trajectory": {
"total": 39200.872351852246,
"count": 889082,
"self": 39080.471363719786,
"children": {
"RLTrainer._checkpoint": {
"total": 120.40098813246004,
"count": 300,
"self": 120.40098813246004
}
}
},
"_update_policy": {
"total": 51428.365887487074,
"count": 7245,
"self": 35151.995161822764,
"children": {
"TorchPOCAOptimizer.update": {
"total": 16276.37072566431,
"count": 217350,
"self": 16276.37072566431
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.4849938452243805e-06,
"count": 1,
"self": 1.4849938452243805e-06
},
"TrainerController._save_models": {
"total": 0.4543167073279619,
"count": 1,
"self": 0.0035243132151663303,
"children": {
"RLTrainer._checkpoint": {
"total": 0.4507923941127956,
"count": 1,
"self": 0.4507923941127956
}
}
}
}
}
}
}