First Commit

043e64d about 2 years ago

46.1 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 0.866117000579834,
	"min": 0.8086401224136353,
	"max": 2.135493516921997,
	"count": 14989
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 18708.126953125,
	"min": 10466.740234375,
	"max": 105615.1484375,
	"count": 14989
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 66.29166666666667,
	"min": 26.98324022346369,
	"max": 125.325,
	"count": 14989
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19092.0,
	"min": 14712.0,
	"max": 22936.0,
	"count": 14989
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1707.7936415009024,
	"min": 1549.168502889312,
	"max": 1746.4515803198233,
	"count": 14989
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 245922.28437612994,
	"min": 120430.73786124286,
	"max": 605872.0984318862,
	"count": 14989
	},
	"SoccerTwos.Step.mean": {
	"value": 199999964.0,
	"min": 50119986.0,
	"max": 199999964.0,
	"count": 14989
	},
	"SoccerTwos.Step.sum": {
	"value": 199999964.0,
	"min": 50119986.0,
	"max": 199999964.0,
	"count": 14989
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": -0.04558149352669716,
	"min": -0.16296879947185516,
	"max": 0.10279054194688797,
	"count": 14989
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": -6.700479507446289,
	"min": -33.77891540527344,
	"max": 16.427635192871094,
	"count": 14989
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.04524017497897148,
	"min": -0.16307416558265686,
	"max": 0.10262896120548248,
	"count": 14989
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": -6.65030574798584,
	"min": -34.11742401123047,
	"max": 16.870479583740234,
	"count": 14989
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 14989
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 14989
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": -0.17092517241328753,
	"min": -0.47276239211742693,
	"max": 0.5691900824712328,
	"count": 14989
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": -25.126000344753265,
	"min": -87.17599999904633,
	"max": 83.58380001783371,
	"count": 14989
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": -0.17092517241328753,
	"min": -0.47276239211742693,
	"max": 0.5691900824712328,
	"count": 14989
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": -25.126000344753265,
	"min": -87.17599999904633,
	"max": 83.58380001783371,
	"count": 14989
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 14989
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 14989
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.018238363913648453,
	"min": 0.008571711436282688,
	"max": 0.026601446373388172,
	"count": 7245
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.018238363913648453,
	"min": 0.008571711436282688,
	"max": 0.026601446373388172,
	"count": 7245
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.09880388751626015,
	"min": 0.06719134338200092,
	"max": 0.15229609956343967,
	"count": 7245
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.09880388751626015,
	"min": 0.06719134338200092,
	"max": 0.15229609956343967,
	"count": 7245
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.09918721541762351,
	"min": 0.06746410404642424,
	"max": 0.15259439150492352,
	"count": 7245
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.09918721541762351,
	"min": 0.06746410404642424,
	"max": 0.15259439150492352,
	"count": 7245
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 6.048997025493988e-09,
	"min": 6.048997025493988e-09,
	"max": 0.0001498667620666315,
	"count": 7245
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 6.048997025493988e-09,
	"min": 6.048997025493988e-09,
	"max": 0.0001498667620666315,
	"count": 7245
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 7245
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 7245
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 1.0297152549999698e-05,
	"min": 1.0297152549999698e-05,
	"max": 0.00749584351315,
	"count": 7245
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 1.0297152549999698e-05,
	"min": 1.0297152549999698e-05,
	"max": 0.00749584351315,
	"count": 7245
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1681458589",
	"python_version": "3.9.16 (main, Mar 8 2023, 14:00:05) \n[GCC 11.2.0]",
	"command_line_arguments": "/data/qyh/env/ml-agents/bin/mlagents-learn ./results/configuration.yaml",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1681660711"
	},
	"total": 202121.95327740815,
	"count": 1,
	"self": 0.7371731949970126,
	"children": {
	"run_training.setup": {
	"total": 0.08580901497043669,
	"count": 1,
	"self": 0.08580901497043669
	},
	"TrainerController.start_learning": {
	"total": 202121.13029519818,
	"count": 1,
	"self": 75.58960591861978,
	"children": {
	"TrainerController._reset_env": {
	"total": 239.88585016061552,
	"count": 750,
	"self": 239.88585016061552
	},
	"TrainerController.advance": {
	"total": 201805.20052092662,
	"count": 889082,
	"self": 43.436931712087244,
	"children": {
	"env_step": {
	"total": 109403.14526834106,
	"count": 889082,
	"self": 35718.75220445846,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 73588.09211776033,
	"count": 11064486,
	"self": 1956.4829019042663,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 71631.60921585606,
	"count": 20304662,
	"self": 71631.60921585606
	}
	}
	},
	"workers": {
	"total": 96.30094612226821,
	"count": 889082,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 3786373.531351197,
	"count": 11061955,
	"is_parallel": true,
	"self": 3543006.6518733725,
	"children": {
	"run_training.setup": {
	"total": 1.372944239526987,
	"count": 16,
	"is_parallel": true,
	"self": 0.8564431574195623,
	"children": {
	"steps_from_proto": {
	"total": 0.05167464469559491,
	"count": 20,
	"is_parallel": true,
	"self": 0.012508621672168374,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.03916602302342653,
	"count": 80,
	"is_parallel": true,
	"self": 0.03916602302342653
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.46482643741182983,
	"count": 10,
	"is_parallel": true,
	"self": 0.012752049136906862,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.009736666223034263,
	"count": 10,
	"is_parallel": true,
	"self": 0.009736666223034263
	},
	"communicator.exchange": {
	"total": 0.4049945876467973,
	"count": 10,
	"is_parallel": true,
	"self": 0.4049945876467973
	},
	"steps_from_proto": {
	"total": 0.037343134405091405,
	"count": 20,
	"is_parallel": true,
	"self": 0.007720504887402058,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.029622629517689347,
	"count": 80,
	"is_parallel": true,
	"self": 0.029622629517689347
	}
	}
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 63.20921622682363,
	"count": 23968,
	"is_parallel": true,
	"self": 10.96054931380786,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 52.24866691301577,
	"count": 95872,
	"is_parallel": true,
	"self": 52.24866691301577
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 243302.29731735843,
	"count": 11061929,
	"is_parallel": true,
	"self": 16865.871614304837,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 10229.591617493192,
	"count": 11061929,
	"is_parallel": true,
	"self": 10229.591617493192
	},
	"communicator.exchange": {
	"total": 170588.07838961575,
	"count": 11061929,
	"is_parallel": true,
	"self": 170588.07838961575
	},
	"steps_from_proto": {
	"total": 45618.75569594465,
	"count": 22123858,
	"is_parallel": true,
	"self": 8546.25141385477,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 37072.50428208988,
	"count": 88495432,
	"is_parallel": true,
	"self": 37072.50428208988
	}
	}
	}
	}
	},
	"TrainerController.start_learning": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"TrainerController._reset_env": {
	"total": 765.6606953628361,
	"count": 2576,
	"is_parallel": true,
	"self": 765.6606953628361
	},
	"TrainerController.advance": {
	"total": 553472.6433439851,
	"count": 3113472,
	"is_parallel": true,
	"self": 127.54399403184652,
	"children": {
	"env_step": {
	"total": 312836.9059403762,
	"count": 3113472,
	"is_parallel": true,
	"self": 104029.15610423265,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 208505.66601867974,
	"count": 37653456,
	"is_parallel": true,
	"self": 5868.197185412049,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 202637.4688332677,
	"count": 69410080,
	"is_parallel": true,
	"self": 202637.4688332677
	}
	}
	},
	"workers": {
	"total": 301.0074671693146,
	"count": 3113472,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 8863163.5911063,
	"count": 37643536,
	"is_parallel": true,
	"self": 8047015.4603802115,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.8267943151295185,
	"count": 320,
	"is_parallel": true,
	"self": 0.20013794675469398,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.6266563683748245,
	"count": 1280,
	"is_parallel": true,
	"self": 0.6266563683748245
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 7.437222998589277,
	"count": 160,
	"is_parallel": true,
	"self": 0.2040327861905098,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.1557866595685482,
	"count": 160,
	"is_parallel": true,
	"self": 0.1557866595685482
	},
	"communicator.exchange": {
	"total": 6.479913402348757,
	"count": 160,
	"is_parallel": true,
	"self": 6.479913402348757
	},
	"steps_from_proto": {
	"total": 0.5974901504814625,
	"count": 320,
	"is_parallel": true,
	"self": 0.12352807819843292,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.47396207228302956,
	"count": 1280,
	"is_parallel": true,
	"self": 0.47396207228302956
	}
	}
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 189.85917573422194,
	"count": 81920,
	"is_parallel": true,
	"self": 32.98321542516351,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 156.87596030905843,
	"count": 327680,
	"is_parallel": true,
	"self": 156.87596030905843
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 815958.2715503536,
	"count": 37643376,
	"is_parallel": true,
	"self": 50899.1951662004,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 34107.74587376788,
	"count": 37643376,
	"is_parallel": true,
	"self": 34107.74587376788
	},
	"communicator.exchange": {
	"total": 584456.3526424319,
	"count": 37643376,
	"is_parallel": true,
	"self": 584456.3526424319
	},
	"steps_from_proto": {
	"total": 146494.97786795348,
	"count": 75286752,
	"is_parallel": true,
	"self": 28645.180666983128,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 117849.79720097035,
	"count": 301147008,
	"is_parallel": true,
	"self": 117849.79720097035
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.13184957904741168,
	"count": 32,
	"is_parallel": true,
	"self": 0.023764571640640497,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.10808500740677118,
	"count": 128,
	"is_parallel": true,
	"self": 0.10808500740677118
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.9445007154718041,
	"count": 16,
	"is_parallel": true,
	"self": 0.08671622956171632,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.033300156239420176,
	"count": 16,
	"is_parallel": true,
	"self": 0.033300156239420176
	},
	"communicator.exchange": {
	"total": 0.6965830507688224,
	"count": 16,
	"is_parallel": true,
	"self": 0.6965830507688224
	},
	"steps_from_proto": {
	"total": 0.12790127890184522,
	"count": 32,
	"is_parallel": true,
	"self": 0.016938731539994478,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.11096254736185074,
	"count": 128,
	"is_parallel": true,
	"self": 0.11096254736185074
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 240508.193409577,
	"count": 3113472,
	"is_parallel": true,
	"self": 4416.851860079914,
	"children": {
	"process_trajectory": {
	"total": 98595.71652773768,
	"count": 3113472,
	"is_parallel": true,
	"self": 98254.31838959828,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 341.3981381393969,
	"count": 1008,
	"is_parallel": true,
	"self": 341.3981381393969
	}
	}
	},
	"_update_policy": {
	"total": 137495.62502175942,
	"count": 24656,
	"is_parallel": true,
	"self": 92660.20954589918,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 44835.41547586024,
	"count": 739680,
	"is_parallel": true,
	"self": 44835.41547586024
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 92358.61832087347,
	"count": 889082,
	"self": 1729.3800815341529,
	"children": {
	"process_trajectory": {
	"total": 39200.872351852246,
	"count": 889082,
	"self": 39080.471363719786,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 120.40098813246004,
	"count": 300,
	"self": 120.40098813246004
	}
	}
	},
	"_update_policy": {
	"total": 51428.365887487074,
	"count": 7245,
	"self": 35151.995161822764,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 16276.37072566431,
	"count": 217350,
	"self": 16276.37072566431
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.4849938452243805e-06,
	"count": 1,
	"self": 1.4849938452243805e-06
	},
	"TrainerController._save_models": {
	"total": 0.4543167073279619,
	"count": 1,
	"self": 0.0035243132151663303,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.4507923941127956,
	"count": 1,
	"self": 0.4507923941127956
	}
	}
	}
	}
	}
	}
	}